<?xml version="1.0" encoding="utf-8"?>
<TEI xmlns="http://www.tei-c.org/ns/1.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:hal="http://hal.archives-ouvertes.fr/" xmlns:gml="http://www.opengis.net/gml/3.3/" xmlns:gmlce="http://www.opengis.net/gml/3.3/ce" version="1.1" xsi:schemaLocation="http://www.tei-c.org/ns/1.0 http://api.archives-ouvertes.fr/documents/aofr-sword.xsd">
  <teiHeader>
    <fileDesc>
      <titleStmt>
        <title>HAL TEI export of lirmm-01674319v2</title>
      </titleStmt>
      <publicationStmt>
        <distributor>CCSD</distributor>
        <availability status="restricted">
          <licence target="https://creativecommons.org/publicdomain/zero/1.0/">CC0 1.0 - Universal</licence>
        </availability>
        <date when="2026-05-03T04:05:29+02:00"/>
      </publicationStmt>
      <sourceDesc>
        <p part="N">HAL API Platform</p>
      </sourceDesc>
    </fileDesc>
  </teiHeader>
  <text>
    <body>
      <listBibl>
        <biblFull>
          <titleStmt>
            <title xml:lang="en">Hierarchical Overlap Graph</title>
            <author role="aut">
              <persName>
                <forename type="first">Bastien</forename>
                <surname>Cazaux</surname>
              </persName>
              <email type="md5">9801dd5f380a8ef2148c88eb68f25fc8</email>
              <email type="domain">lirmm.fr</email>
              <idno type="idhal" notation="string">cazaux-bastien</idno>
              <idno type="idhal" notation="numeric">3129</idno>
              <idno type="halauthorid" notation="string">23494-3129</idno>
              <idno type="IDREF">https://www.idref.fr/226877523</idno>
              <affiliation ref="#struct-388224"/>
              <affiliation ref="#struct-1002368"/>
            </author>
            <author role="aut">
              <persName>
                <forename type="first">Eric</forename>
                <surname>Rivals</surname>
              </persName>
              <email type="md5">2948fa0e637f8fdead28884bcc311d7f</email>
              <email type="domain">lirmm.fr</email>
              <idno type="idhal" notation="string">eric-rivals</idno>
              <idno type="idhal" notation="numeric">2002</idno>
              <idno type="halauthorid" notation="string">23559-2002</idno>
              <idno type="ORCID">https://orcid.org/0000-0003-3791-3973</idno>
              <idno type="IDREF">https://www.idref.fr/118021850</idno>
              <affiliation ref="#struct-388224"/>
              <affiliation ref="#struct-1002368"/>
            </author>
            <editor role="depositor">
              <persName>
                <forename>Eric</forename>
                <surname>Rivals</surname>
              </persName>
              <email type="md5">18b1a627af6df8b912fd128ee2d82dee</email>
              <email type="domain">lirmm.fr</email>
            </editor>
            <funder ref="#projanr-37873"/>
            <funder>Défi MASTODONS</funder>
          </titleStmt>
          <editionStmt>
            <edition n="v1">
              <date type="whenSubmitted">2018-01-02 12:29:03</date>
            </edition>
            <edition n="v2" type="current">
              <date type="whenSubmitted">2018-01-29 10:22:28</date>
              <date type="whenWritten">2017</date>
              <date type="whenModified">2025-03-23 03:12:47</date>
              <date type="whenReleased">2018-01-30 16:23:21</date>
              <date type="whenProduced">2020-03</date>
              <date type="whenEndEmbargoed">2018-01-29</date>
              <ref type="file" target="https://hal-lirmm.ccsd.cnrs.fr/lirmm-01674319v2/document">
                <date notBefore="2018-01-29"/>
              </ref>
              <ref type="file" subtype="author" n="1" target="https://hal-lirmm.ccsd.cnrs.fr/lirmm-01674319v2/file/hog-art.pdf" id="file-1695189-1737229">
                <date notBefore="2018-01-29"/>
              </ref>
              <ref type="externalLink" target="http://arxiv.org/pdf/1802.04632"/>
            </edition>
            <respStmt>
              <resp>contributor</resp>
              <name key="113912">
                <persName>
                  <forename>Eric</forename>
                  <surname>Rivals</surname>
                </persName>
                <email type="md5">18b1a627af6df8b912fd128ee2d82dee</email>
                <email type="domain">lirmm.fr</email>
              </name>
            </respStmt>
          </editionStmt>
          <publicationStmt>
            <distributor>CCSD</distributor>
            <idno type="halId">lirmm-01674319</idno>
            <idno type="halUri">https://hal-lirmm.ccsd.cnrs.fr/lirmm-01674319</idno>
            <idno type="halBibtex">cazaux:lirmm-01674319</idno>
            <idno type="halRefHtml">&lt;i&gt;Information Processing Letters&lt;/i&gt;, 2020, 155, pp.#105862. &lt;a target="_blank" href="https://dx.doi.org/10.1016/j.ipl.2019.105862"&gt;&amp;#x27E8;10.1016/j.ipl.2019.105862&amp;#x27E9;&lt;/a&gt;</idno>
            <idno type="halRef">Information Processing Letters, 2020, 155, pp.#105862. &amp;#x27E8;10.1016/j.ipl.2019.105862&amp;#x27E9;</idno>
            <availability status="restricted">
              <licence target="https://about.hal.science/hal-authorisation-v1/">HAL Authorization<ref corresp="#file-1695189-1737229"/></licence>
            </availability>
          </publicationStmt>
          <seriesStmt>
            <idno type="stamp" n="CNRS">CNRS - Centre national de la recherche scientifique</idno>
            <idno type="stamp" n="MAB" corresp="LIRMM">Méthodes et Algorithmes pour la Bioinformatique</idno>
            <idno type="stamp" n="35792">SIFR</idno>
            <idno type="stamp" n="LIRMM">Laboratoire d'Informatique de Robotique et de Microélectronique de Montpellier</idno>
            <idno type="stamp" n="MIPS">Mathématiques, Informatique, Physique et Systèmes</idno>
            <idno type="stamp" n="UNIV-MONTPELLIER">Université de Montpellier</idno>
            <idno type="stamp" n="INRAE">Institut National de Recherche en Agriculture, Alimentation et Environnement</idno>
            <idno type="stamp" n="ANR">ANR</idno>
            <idno type="stamp" n="UM-2015-2021" corresp="UNIV-MONTPELLIER">Université de Montpellier (2015-2021)</idno>
          </seriesStmt>
          <notesStmt>
            <note type="audience" n="2">International</note>
            <note type="popular" n="0">No</note>
            <note type="peer" n="1">Yes</note>
          </notesStmt>
          <sourceDesc>
            <biblStruct>
              <analytic>
                <title xml:lang="en">Hierarchical Overlap Graph</title>
                <author role="aut">
                  <persName>
                    <forename type="first">Bastien</forename>
                    <surname>Cazaux</surname>
                  </persName>
                  <email type="md5">9801dd5f380a8ef2148c88eb68f25fc8</email>
                  <email type="domain">lirmm.fr</email>
                  <idno type="idhal" notation="string">cazaux-bastien</idno>
                  <idno type="idhal" notation="numeric">3129</idno>
                  <idno type="halauthorid" notation="string">23494-3129</idno>
                  <idno type="IDREF">https://www.idref.fr/226877523</idno>
                  <affiliation ref="#struct-388224"/>
                  <affiliation ref="#struct-1002368"/>
                </author>
                <author role="aut">
                  <persName>
                    <forename type="first">Eric</forename>
                    <surname>Rivals</surname>
                  </persName>
                  <email type="md5">2948fa0e637f8fdead28884bcc311d7f</email>
                  <email type="domain">lirmm.fr</email>
                  <idno type="idhal" notation="string">eric-rivals</idno>
                  <idno type="idhal" notation="numeric">2002</idno>
                  <idno type="halauthorid" notation="string">23559-2002</idno>
                  <idno type="ORCID">https://orcid.org/0000-0003-3791-3973</idno>
                  <idno type="IDREF">https://www.idref.fr/118021850</idno>
                  <affiliation ref="#struct-388224"/>
                  <affiliation ref="#struct-1002368"/>
                </author>
              </analytic>
              <monogr>
                <idno type="halJournalId" status="VALID">14186</idno>
                <idno type="issn">0020-0190</idno>
                <title level="j">Information Processing Letters</title>
                <imprint>
                  <publisher>Elsevier</publisher>
                  <biblScope unit="volume">155</biblScope>
                  <biblScope unit="pp">#105862</biblScope>
                  <date type="datePub">2020-03</date>
                </imprint>
              </monogr>
              <idno type="doi">10.1016/j.ipl.2019.105862</idno>
              <ref target="http://www.lirmm.fr/ ̃rivals/res/superstring/hog-art-appendix.pdf" type="seeAlso"/>
            </biblStruct>
          </sourceDesc>
          <profileDesc>
            <langUsage>
              <language ident="en">English</language>
            </langUsage>
            <textClass>
              <keywords scheme="author">
                <term xml:lang="en">APSP</term>
                <term xml:lang="en">stringology</term>
                <term xml:lang="en">prefix</term>
                <term xml:lang="en">digraph</term>
                <term xml:lang="en">assembly</term>
                <term xml:lang="en">overlap graph</term>
                <term xml:lang="en">suffix</term>
                <term xml:lang="en">superstring</term>
                <term xml:lang="en">greedy</term>
                <term xml:lang="en">Aho-Corasik</term>
              </keywords>
              <classCode scheme="acm" n="F.2.2">F.: Theory of Computation/F.2: ANALYSIS OF ALGORITHMS AND PROBLEM COMPLEXITY/F.2.2: Nonnumerical Algorithms and Problems</classCode>
              <classCode scheme="halDomain" n="info.info-ds">Computer Science [cs]/Data Structures and Algorithms [cs.DS]</classCode>
              <classCode scheme="halDomain" n="info.info-bi">Computer Science [cs]/Bioinformatics [q-bio.QM]</classCode>
              <classCode scheme="halTypology" n="ART">Journal articles</classCode>
              <classCode scheme="halOldTypology" n="ART">Journal articles</classCode>
              <classCode scheme="halTreeTypology" n="ART">Journal articles</classCode>
            </textClass>
            <abstract xml:lang="fr">
              <p>Given a set of finite words, the Overlap Graph (OG) is a complete weighted digraph where each word is a node and where the weight of an arc equals the length of the longest overlap of one word onto the other (Overlap is an asymmetric notion). The OG serves to assemble DNA fragments or to compute shortest superstrings, which are a compressed representation of the input. The OG requires space that is quadratic in the number of words, which limits its scalability. The Hierarchical Overlap Graph (HOG) is an alternative graph that also encodes all maximal overlaps, but uses space that is linear in the sum of the lengths of the input words. We propose the first algorithm to build the HOG in linear space for words of equal length.</p>
            </abstract>
          </profileDesc>
        </biblFull>
      </listBibl>
    </body>
    <back>
      <listOrg type="structures">
        <org type="researchteam" xml:id="struct-388224" status="OLD">
          <orgName>Méthodes et Algorithmes pour la Bioinformatique</orgName>
          <orgName type="acronym">MAB</orgName>
          <date type="end">2021-12-31</date>
          <desc>
            <address>
              <addrLine>LIRMM, 161 rue Ada, 34000 Montpellier</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">https://www.lirmm.fr/equipes/MAB/</ref>
          </desc>
          <listRelation>
            <relation active="#struct-181" type="direct"/>
            <relation name="UMR5506" active="#struct-410122" type="indirect"/>
            <relation name="UMR5506" active="#struct-441569" type="indirect"/>
          </listRelation>
        </org>
        <org type="laboratory" xml:id="struct-1002368" status="OLD">
          <orgName>Institut de Biologie Computationnelle</orgName>
          <orgName type="acronym">IBC</orgName>
          <date type="start">2020-01-01</date>
          <date type="end">2021-12-31</date>
          <desc>
            <address>
              <addrLine>95 rue de la Galéra, 34095 Montpellier</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">http://www.ibc-montpellier.fr/</ref>
          </desc>
          <listRelation>
            <relation active="#struct-300009" type="direct"/>
            <relation active="#struct-410122" type="direct"/>
            <relation active="#struct-441569" type="direct"/>
            <relation active="#struct-577435" type="direct"/>
          </listRelation>
        </org>
        <org type="laboratory" xml:id="struct-181" status="OLD">
          <idno type="IdRef">139590827</idno>
          <idno type="ISNI">0000000405990488</idno>
          <idno type="RNSR">199111950H</idno>
          <idno type="ROR">https://ror.org/013yean28</idno>
          <orgName>Laboratoire d'Informatique de Robotique et de Microélectronique de Montpellier</orgName>
          <orgName type="acronym">LIRMM</orgName>
          <date type="start">1995-01-01</date>
          <date type="end">2021-12-31</date>
          <desc>
            <address>
              <addrLine>161 rue Ada - 34095 Montpellier</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">https://www.lirmm.fr</ref>
          </desc>
          <listRelation>
            <relation name="UMR5506" active="#struct-410122" type="direct"/>
            <relation name="UMR5506" active="#struct-441569" type="direct"/>
          </listRelation>
        </org>
        <org type="institution" xml:id="struct-410122" status="OLD">
          <idno type="ISNI">0000000120970141</idno>
          <idno type="ROR">https://ror.org/051escj72</idno>
          <orgName>Université de Montpellier</orgName>
          <orgName type="acronym">UM</orgName>
          <date type="end">2021-12-31</date>
          <desc>
            <address>
              <addrLine>163 rue Auguste Broussonnet - 34090 Montpellier</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">http://www.umontpellier.fr/</ref>
          </desc>
        </org>
        <org type="regroupinstitution" xml:id="struct-441569" status="VALID">
          <idno type="IdRef">02636817X</idno>
          <idno type="ISNI">0000000122597504</idno>
          <idno type="ROR">https://ror.org/02feahw73</idno>
          <orgName>Centre National de la Recherche Scientifique</orgName>
          <orgName type="acronym">CNRS</orgName>
          <date type="start">1939-10-19</date>
          <desc>
            <address>
              <country key="FR"/>
            </address>
            <ref type="url">https://www.cnrs.fr/</ref>
          </desc>
        </org>
        <org type="institution" xml:id="struct-300009" status="VALID">
          <idno type="ROR">https://ror.org/02kvxyf05</idno>
          <orgName>Institut National de Recherche en Informatique et en Automatique</orgName>
          <orgName type="acronym">Inria</orgName>
          <desc>
            <address>
              <addrLine>Domaine de VoluceauRocquencourt - BP 10578153 Le Chesnay Cedex</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">http://www.inria.fr/en/</ref>
          </desc>
        </org>
        <org type="institution" xml:id="struct-577435" status="VALID">
          <idno type="ROR">https://ror.org/003vg9w96</idno>
          <orgName>Institut National de Recherche pour l’Agriculture, l’Alimentation et l’Environnement</orgName>
          <orgName type="acronym">INRAE</orgName>
          <date type="start">2020-01-01</date>
          <desc>
            <address>
              <country key="FR"/>
            </address>
          </desc>
        </org>
      </listOrg>
      <listOrg type="projects">
        <org type="anrProject" xml:id="projanr-37873" status="VALID">
          <idno type="anr">ANR-11-BINF-0002</idno>
          <idno type="program">Bio-informatique</idno>
          <orgName>IBC</orgName>
          <desc>Institut de biologie Computationnelle</desc>
          <date type="start">2011</date>
        </org>
      </listOrg>
    </back>
  </text>
</TEI>