<?xml version="1.0" encoding="utf-8"?>
<TEI xmlns="http://www.tei-c.org/ns/1.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:hal="http://hal.archives-ouvertes.fr/" xmlns:gml="http://www.opengis.net/gml/3.3/" xmlns:gmlce="http://www.opengis.net/gml/3.3/ce" version="1.1" xsi:schemaLocation="http://www.tei-c.org/ns/1.0 http://api.archives-ouvertes.fr/documents/aofr-sword.xsd">
  <teiHeader>
    <fileDesc>
      <titleStmt>
        <title>HAL TEI export of lirmm-03117453</title>
      </titleStmt>
      <publicationStmt>
        <distributor>CCSD</distributor>
        <availability status="restricted">
          <licence target="https://creativecommons.org/publicdomain/zero/1.0/">CC0 1.0 - Universal</licence>
        </availability>
        <date when="2026-05-22T14:36:56+02:00"/>
      </publicationStmt>
      <sourceDesc>
        <p part="N">HAL API Platform</p>
      </sourceDesc>
    </fileDesc>
  </teiHeader>
  <text>
    <body>
      <listBibl>
        <biblFull>
          <titleStmt>
            <title xml:lang="en">RedOak: a reference-free and alignment-free structure for indexing a collection of similar genomes</title>
            <author role="aut">
              <persName>
                <forename type="first">Clément</forename>
                <surname>Agret</surname>
              </persName>
              <email type="md5">6ae57246ee27ff2ed4fff3d53e070d2e</email>
              <email type="domain">lirmm.fr</email>
              <idno type="idhal" notation="numeric">1211256</idno>
              <idno type="halauthorid" notation="string">1865818-1211256</idno>
              <idno type="ORCID">https://orcid.org/0000-0002-7404-7253</idno>
              <idno type="IDREF">https://www.idref.fr/250366339</idno>
              <affiliation ref="#struct-388224"/>
              <affiliation ref="#struct-1002398"/>
            </author>
            <author role="aut">
              <persName>
                <forename type="first">Annie</forename>
                <surname>Chateau</surname>
              </persName>
              <email type="md5">4c0e4613d8ee10ee4e1c98180000b379</email>
              <email type="domain">lirmm.fr</email>
              <idno type="idhal" notation="string">annie-chateau</idno>
              <idno type="idhal" notation="numeric">173624</idno>
              <idno type="halauthorid" notation="string">44100-173624</idno>
              <idno type="ORCID">https://orcid.org/0000-0003-4760-8171</idno>
              <idno type="IDREF">https://www.idref.fr/227798856</idno>
              <affiliation ref="#struct-388224"/>
            </author>
            <author role="aut">
              <persName>
                <forename type="first">Gaëtan</forename>
                <surname>Droc</surname>
              </persName>
              <email type="md5">e92d42b1804a1f1a5d30d17d92911a37</email>
              <email type="domain">cirad.fr</email>
              <idno type="idhal" notation="numeric">1213825</idno>
              <idno type="halauthorid" notation="string">446935-1213825</idno>
              <idno type="ORCID">https://orcid.org/0000-0003-1849-1269</idno>
              <idno type="IDREF">https://www.idref.fr/250355345</idno>
              <idno type="VIAF">https://viaf.org/viaf/168160789859202682279</idno>
              <affiliation ref="#struct-168219"/>
              <affiliation ref="#struct-1002398"/>
            </author>
            <author role="aut">
              <persName>
                <forename type="first">Gautier</forename>
                <surname>Sarah</surname>
              </persName>
              <email type="md5">e71b7a5c0f11d6867d9e84362c5403da</email>
              <email type="domain">inra.fr</email>
              <idno type="idhal" notation="string">gsarah</idno>
              <idno type="idhal" notation="numeric">1206554</idno>
              <idno type="halauthorid" notation="string">904889-1206554</idno>
              <idno type="ORCID">https://orcid.org/0000-0001-5179-972X</idno>
              <affiliation ref="#struct-1002398"/>
            </author>
            <author role="aut">
              <persName>
                <forename type="first">Alban</forename>
                <surname>Mancheron</surname>
              </persName>
              <email type="md5">ce3caf574b0e2c250ca57256ca29269e</email>
              <email type="domain">inria.fr</email>
              <idno type="idhal" notation="string">alban-mancheron</idno>
              <idno type="idhal" notation="numeric">6019</idno>
              <idno type="halauthorid" notation="string">17693-6019</idno>
              <idno type="ORCID">https://orcid.org/0000-0001-9249-7592</idno>
              <idno type="IDREF">https://www.idref.fr/111581362</idno>
              <affiliation ref="#struct-388224"/>
            </author>
            <author role="aut">
              <persName>
                <forename type="first">Manuel</forename>
                <surname>Ruiz</surname>
              </persName>
              <email type="md5">f4b91ca332ea2d8fb35219fde774db2f</email>
              <email type="domain">cirad.fr</email>
              <idno type="idhal" notation="numeric">1203055</idno>
              <idno type="halauthorid" notation="string">446941-1203055</idno>
              <idno type="ORCID">https://orcid.org/0000-0001-8153-276X</idno>
              <idno type="IDREF">https://www.idref.fr/069152543</idno>
              <affiliation ref="#struct-168219"/>
              <affiliation ref="#struct-1002398"/>
            </author>
            <editor role="depositor">
              <persName>
                <forename>Alban</forename>
                <surname>Mancheron</surname>
              </persName>
              <email type="md5">6118fb5e940d1b1f5500c967a8327983</email>
              <email type="domain">lirmm.fr</email>
            </editor>
            <funder ref="#projanr-38027"/>
          </titleStmt>
          <editionStmt>
            <edition n="v1" type="current">
              <date type="whenSubmitted">2021-01-21 11:06:00</date>
              <date type="whenModified">2025-07-17 03:06:55</date>
              <date type="whenReleased">2021-01-21 12:45:24</date>
              <date type="whenProduced">2021-01-21</date>
              <date type="whenEndEmbargoed">2021-01-21</date>
              <ref type="file" target="https://hal-lirmm.ccsd.cnrs.fr/lirmm-03117453v1/document">
                <date notBefore="2021-01-21"/>
              </ref>
              <ref type="file" n="1" target="https://hal-lirmm.ccsd.cnrs.fr/lirmm-03117453v1/file/2020.12.19.423583v1.full.pdf" id="file-3117453-2730343">
                <date notBefore="2021-01-21"/>
              </ref>
              <ref type="externalLink" target="https://hal-lirmm.ccsd.cnrs.fr/lirmm-03117453/file/2020.12.19.423583v1.full.pdf"/>
            </edition>
            <respStmt>
              <resp>contributor</resp>
              <name key="126020">
                <persName>
                  <forename>Alban</forename>
                  <surname>Mancheron</surname>
                </persName>
                <email type="md5">6118fb5e940d1b1f5500c967a8327983</email>
                <email type="domain">lirmm.fr</email>
              </name>
            </respStmt>
          </editionStmt>
          <publicationStmt>
            <distributor>CCSD</distributor>
            <idno type="halId">lirmm-03117453</idno>
            <idno type="halUri">https://hal-lirmm.ccsd.cnrs.fr/lirmm-03117453</idno>
            <idno type="halBibtex">agret:lirmm-03117453</idno>
            <idno type="halRefHtml">2021</idno>
            <idno type="halRef">2021</idno>
            <availability status="restricted">
              <licence target="https://about.hal.science/hal-authorisation-v1/">HAL Authorization<ref corresp="#file-3117453-2730343"/></licence>
            </availability>
          </publicationStmt>
          <seriesStmt>
            <idno type="stamp" n="CIRAD">CIRAD - Centre de coopération internationale en recherche agronomique pour le développement</idno>
            <idno type="stamp" n="CNRS">CNRS - Centre national de la recherche scientifique</idno>
            <idno type="stamp" n="MAB" corresp="LIRMM">Méthodes et Algorithmes pour la Bioinformatique</idno>
            <idno type="stamp" n="LIRMM">Laboratoire d'Informatique de Robotique et de Microélectronique de Montpellier</idno>
            <idno type="stamp" n="AGREENIUM">Archive ouverte en agrobiosciences</idno>
            <idno type="stamp" n="MIPS">Mathématiques, Informatique, Physique et Systèmes</idno>
            <idno type="stamp" n="BA">Biologie-AgroSciences</idno>
            <idno type="stamp" n="UNIV-MONTPELLIER">Université de Montpellier</idno>
            <idno type="stamp" n="INSTITUT-AGRO-MONTPELLIER">Institut Agro Montpellier</idno>
            <idno type="stamp" n="INRAE">Institut National de Recherche en Agriculture, Alimentation et Environnement</idno>
            <idno type="stamp" n="INRAEOCCITANIEMONTPELLIER" corresp="INRAE">INRAE Occitanie Montpellier</idno>
            <idno type="stamp" n="ANR">ANR</idno>
            <idno type="stamp" n="AGAP">AGAP </idno>
            <idno type="stamp" n="UM-2015-2021" corresp="UNIV-MONTPELLIER">Université de Montpellier (2015-2021)</idno>
            <idno type="stamp" n="INSTITUT-AGRO">Institut Agro</idno>
            <idno type="stamp" n="BIOLOGIE_ET_AMELIORATION_DES_PLANTES">Département BAP INRAE</idno>
          </seriesStmt>
          <notesStmt/>
          <sourceDesc>
            <biblStruct>
              <analytic>
                <title xml:lang="en">RedOak: a reference-free and alignment-free structure for indexing a collection of similar genomes</title>
                <author role="aut">
                  <persName>
                    <forename type="first">Clément</forename>
                    <surname>Agret</surname>
                  </persName>
                  <email type="md5">6ae57246ee27ff2ed4fff3d53e070d2e</email>
                  <email type="domain">lirmm.fr</email>
                  <idno type="idhal" notation="numeric">1211256</idno>
                  <idno type="halauthorid" notation="string">1865818-1211256</idno>
                  <idno type="ORCID">https://orcid.org/0000-0002-7404-7253</idno>
                  <idno type="IDREF">https://www.idref.fr/250366339</idno>
                  <affiliation ref="#struct-388224"/>
                  <affiliation ref="#struct-1002398"/>
                </author>
                <author role="aut">
                  <persName>
                    <forename type="first">Annie</forename>
                    <surname>Chateau</surname>
                  </persName>
                  <email type="md5">4c0e4613d8ee10ee4e1c98180000b379</email>
                  <email type="domain">lirmm.fr</email>
                  <idno type="idhal" notation="string">annie-chateau</idno>
                  <idno type="idhal" notation="numeric">173624</idno>
                  <idno type="halauthorid" notation="string">44100-173624</idno>
                  <idno type="ORCID">https://orcid.org/0000-0003-4760-8171</idno>
                  <idno type="IDREF">https://www.idref.fr/227798856</idno>
                  <affiliation ref="#struct-388224"/>
                </author>
                <author role="aut">
                  <persName>
                    <forename type="first">Gaëtan</forename>
                    <surname>Droc</surname>
                  </persName>
                  <email type="md5">e92d42b1804a1f1a5d30d17d92911a37</email>
                  <email type="domain">cirad.fr</email>
                  <idno type="idhal" notation="numeric">1213825</idno>
                  <idno type="halauthorid" notation="string">446935-1213825</idno>
                  <idno type="ORCID">https://orcid.org/0000-0003-1849-1269</idno>
                  <idno type="IDREF">https://www.idref.fr/250355345</idno>
                  <idno type="VIAF">https://viaf.org/viaf/168160789859202682279</idno>
                  <affiliation ref="#struct-168219"/>
                  <affiliation ref="#struct-1002398"/>
                </author>
                <author role="aut">
                  <persName>
                    <forename type="first">Gautier</forename>
                    <surname>Sarah</surname>
                  </persName>
                  <email type="md5">e71b7a5c0f11d6867d9e84362c5403da</email>
                  <email type="domain">inra.fr</email>
                  <idno type="idhal" notation="string">gsarah</idno>
                  <idno type="idhal" notation="numeric">1206554</idno>
                  <idno type="halauthorid" notation="string">904889-1206554</idno>
                  <idno type="ORCID">https://orcid.org/0000-0001-5179-972X</idno>
                  <affiliation ref="#struct-1002398"/>
                </author>
                <author role="aut">
                  <persName>
                    <forename type="first">Alban</forename>
                    <surname>Mancheron</surname>
                  </persName>
                  <email type="md5">ce3caf574b0e2c250ca57256ca29269e</email>
                  <email type="domain">inria.fr</email>
                  <idno type="idhal" notation="string">alban-mancheron</idno>
                  <idno type="idhal" notation="numeric">6019</idno>
                  <idno type="halauthorid" notation="string">17693-6019</idno>
                  <idno type="ORCID">https://orcid.org/0000-0001-9249-7592</idno>
                  <idno type="IDREF">https://www.idref.fr/111581362</idno>
                  <affiliation ref="#struct-388224"/>
                </author>
                <author role="aut">
                  <persName>
                    <forename type="first">Manuel</forename>
                    <surname>Ruiz</surname>
                  </persName>
                  <email type="md5">f4b91ca332ea2d8fb35219fde774db2f</email>
                  <email type="domain">cirad.fr</email>
                  <idno type="idhal" notation="numeric">1203055</idno>
                  <idno type="halauthorid" notation="string">446941-1203055</idno>
                  <idno type="ORCID">https://orcid.org/0000-0001-8153-276X</idno>
                  <idno type="IDREF">https://www.idref.fr/069152543</idno>
                  <affiliation ref="#struct-168219"/>
                  <affiliation ref="#struct-1002398"/>
                </author>
              </analytic>
              <monogr>
                <imprint/>
              </monogr>
              <idno type="doi">10.1101/2020.12.19.423583</idno>
              <ref target="https://gitlab.info-ufr.univ-montp2.fr/DoccY/RedOak" type="seeAlso"/>
            </biblStruct>
          </sourceDesc>
          <profileDesc>
            <langUsage>
              <language ident="en">English</language>
            </langUsage>
            <textClass>
              <keywords scheme="author">
                <term xml:lang="en">Data structure</term>
                <term xml:lang="en">Similar genomes</term>
                <term xml:lang="en">Pan-genomes</term>
                <term xml:lang="en">k-mer</term>
              </keywords>
              <classCode scheme="halDomain" n="info.info-ds">Computer Science [cs]/Data Structures and Algorithms [cs.DS]</classCode>
              <classCode scheme="halTypology" n="UNDEFINED">Preprints, Working Papers, ...</classCode>
              <classCode scheme="halOldTypology" n="UNDEFINED">Preprints, Working Papers, ...</classCode>
              <classCode scheme="halTreeTypology" n="UNDEFINED">Preprints, Working Papers, ...</classCode>
            </textClass>
            <abstract xml:lang="en">
              <p>Background: As the cost of DNA sequencing decreases, high-throughput sequencing technologies become increasingly accessible to many laboratories. Consequently, new issues emerge that require new algorithms, including tools for indexing and compressing hundred to thousands of complete genomes. Results: This paper presents RedOak, a reference-free and alignment-free software package that allows for the indexing of a large collection of similar genomes. RedOak can also be applied to reads from unassembled genomes, and it provides a nucleotide sequence query function. This software is based on a k-mer approach and has been developed to be heavily parallelized and distributed on several nodes of a cluster. The source code of our RedOak algorithm is available at https://gitlab.info-ufr.univ-montp2.fr/DoccY/RedOak. Conclusions: RedOak may be really useful for biologists and bioinformaticians expecting to extract information from large sequence datasets.</p>
            </abstract>
          </profileDesc>
        </biblFull>
      </listBibl>
    </body>
    <back>
      <listOrg type="structures">
        <org type="researchteam" xml:id="struct-388224" status="OLD">
          <orgName>Méthodes et Algorithmes pour la Bioinformatique</orgName>
          <orgName type="acronym">MAB</orgName>
          <date type="end">2021-12-31</date>
          <desc>
            <address>
              <addrLine>LIRMM, 161 rue Ada, 34000 Montpellier</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">https://www.lirmm.fr/equipes/MAB/</ref>
          </desc>
          <listRelation>
            <relation active="#struct-181" type="direct"/>
            <relation name="UMR5506" active="#struct-410122" type="indirect"/>
            <relation name="UMR5506" active="#struct-441569" type="indirect"/>
          </listRelation>
        </org>
        <org type="laboratory" xml:id="struct-1002398" status="OLD">
          <idno type="ISNI">0000000404458705</idno>
          <idno type="RNSR">201119637B</idno>
          <idno type="ROR">https://ror.org/02w4exq36</idno>
          <orgName>Amélioration génétique et adaptation des plantes méditerranéennes et tropicales</orgName>
          <orgName type="acronym">UMR AGAP</orgName>
          <date type="start">2020-01-01</date>
          <date type="end">2021-12-31</date>
          <desc>
            <address>
              <addrLine>TA A-108 / 03 - Avenue Agropolis - 34398 Montpellier Cedex 5 France</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">http://umr-agap.cirad.fr</ref>
          </desc>
          <listRelation>
            <relation name="UMR108" active="#struct-11574" type="direct"/>
            <relation active="#struct-577435" type="direct"/>
            <relation active="#struct-1090073" type="direct"/>
            <relation active="#struct-1042499" type="indirect"/>
          </listRelation>
        </org>
        <org type="regrouplaboratory" xml:id="struct-168219" status="VALID">
          <orgName>Département Systèmes Biologiques</orgName>
          <orgName type="acronym">Cirad-BIOS</orgName>
          <date type="start">2007-01-01</date>
          <desc>
            <address>
              <addrLine>Avenue Agropolis TA A-DIR / 04 34398 Montpellier Cedex 5 France</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">https://www.cirad.fr/qui-sommes-nous/organigramme/departements-scientifiques/systemes-biologiques-bios/presentation</ref>
          </desc>
          <listRelation>
            <relation active="#struct-11574" type="direct"/>
          </listRelation>
        </org>
        <org type="laboratory" xml:id="struct-181" status="OLD">
          <idno type="IdRef">139590827</idno>
          <idno type="ISNI">0000000405990488</idno>
          <idno type="RNSR">199111950H</idno>
          <idno type="ROR">https://ror.org/013yean28</idno>
          <orgName>Laboratoire d'Informatique de Robotique et de Microélectronique de Montpellier</orgName>
          <orgName type="acronym">LIRMM</orgName>
          <date type="start">1995-01-01</date>
          <date type="end">2021-12-31</date>
          <desc>
            <address>
              <addrLine>161 rue Ada - 34095 Montpellier</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">https://www.lirmm.fr</ref>
          </desc>
          <listRelation>
            <relation name="UMR5506" active="#struct-410122" type="direct"/>
            <relation name="UMR5506" active="#struct-441569" type="direct"/>
          </listRelation>
        </org>
        <org type="institution" xml:id="struct-410122" status="OLD">
          <idno type="ISNI">0000000120970141</idno>
          <idno type="ROR">https://ror.org/051escj72</idno>
          <orgName>Université de Montpellier</orgName>
          <orgName type="acronym">UM</orgName>
          <date type="end">2021-12-31</date>
          <desc>
            <address>
              <addrLine>163 rue Auguste Broussonnet - 34090 Montpellier</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">http://www.umontpellier.fr/</ref>
          </desc>
        </org>
        <org type="regroupinstitution" xml:id="struct-441569" status="VALID">
          <idno type="IdRef">02636817X</idno>
          <idno type="ISNI">0000000122597504</idno>
          <idno type="ROR">https://ror.org/02feahw73</idno>
          <orgName>Centre National de la Recherche Scientifique</orgName>
          <orgName type="acronym">CNRS</orgName>
          <date type="start">1939-10-19</date>
          <desc>
            <address>
              <country key="FR"/>
            </address>
            <ref type="url">https://www.cnrs.fr/</ref>
          </desc>
        </org>
        <org type="institution" xml:id="struct-11574" status="VALID">
          <idno type="ISNI">0000000121539871</idno>
          <idno type="ROR">https://ror.org/05kpkpg04</idno>
          <orgName>Centre de Coopération Internationale en Recherche Agronomique pour le Développement</orgName>
          <orgName type="acronym">Cirad</orgName>
          <date type="start">1984-06-01</date>
          <desc>
            <address>
              <addrLine>Siège 42, rue Scheffer 75116 Paris</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">http://www.cirad.fr</ref>
          </desc>
        </org>
        <org type="institution" xml:id="struct-577435" status="VALID">
          <idno type="ROR">https://ror.org/003vg9w96</idno>
          <orgName>Institut National de Recherche pour l’Agriculture, l’Alimentation et l’Environnement</orgName>
          <orgName type="acronym">INRAE</orgName>
          <date type="start">2020-01-01</date>
          <desc>
            <address>
              <country key="FR"/>
            </address>
          </desc>
        </org>
        <org type="institution" xml:id="struct-1090073" status="OLD">
          <idno type="IdRef">261038990</idno>
          <idno type="ROR">https://ror.org/03rnk6m14</idno>
          <orgName>Institut Agro - Montpellier SupAgro</orgName>
          <date type="start">2020-01-01</date>
          <date type="end">2021-12-31</date>
          <desc>
            <address>
              <addrLine>2, place Viala - Montpellier</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">https://www.institut-agro-montpellier.fr/</ref>
          </desc>
          <listRelation>
            <relation active="#struct-1042499" type="direct"/>
          </listRelation>
        </org>
        <org type="regroupinstitution" xml:id="struct-1042499" status="VALID">
          <idno type="IdRef">260373249</idno>
          <idno type="ROR">https://ror.org/01dkyve95</idno>
          <orgName>Institut national d'enseignement supérieur pour l'agriculture, l'alimentation et l'environnement</orgName>
          <orgName type="acronym">Institut Agro</orgName>
          <date type="start">2020-01-01</date>
          <desc>
            <address>
              <country key="FR"/>
            </address>
            <ref type="url">https://www.institut-agro.fr</ref>
          </desc>
        </org>
      </listOrg>
      <listOrg type="projects">
        <org type="anrProject" xml:id="projanr-38027" status="VALID">
          <idno type="anr">ANR-11-INBS-0013</idno>
          <idno type="program">Infrastructures</idno>
          <orgName>IFB (ex Renabi-IFB)</orgName>
          <desc>Institut français de bioinformatique</desc>
          <date type="start">2011</date>
        </org>
      </listOrg>
    </back>
  </text>
</TEI>