<?xml version="1.0" encoding="utf-8"?>
<TEI xmlns="http://www.tei-c.org/ns/1.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:hal="http://hal.archives-ouvertes.fr/" xmlns:gml="http://www.opengis.net/gml/3.3/" xmlns:gmlce="http://www.opengis.net/gml/3.3/ce" version="1.1" xsi:schemaLocation="http://www.tei-c.org/ns/1.0 http://api.archives-ouvertes.fr/documents/aofr-sword.xsd">
  <!-- Header describing this export file itself: its title, distributor, licence and a timestamp. -->
  <teiHeader>
    <fileDesc>
      <titleStmt>
        <!-- The title embeds the identifier lirmm-00399025, the same value as the halId idno in the record body. -->
        <title>HAL TEI export of lirmm-00399025</title>
      </titleStmt>
      <publicationStmt>
        <distributor>CCSD</distributor>
        <!-- NOTE(review): status="restricted" is paired with a CC0 licence; presumably the licence applies to this metadata export rather than to the deposited file (confirm). -->
        <availability status="restricted">
          <licence target="https://creativecommons.org/publicdomain/zero/1.0/">CC0 1.0 - Universal</licence>
        </availability>
        <!-- Timestamp with an explicit +02:00 offset; presumably the moment the export was generated (confirm). -->
        <date when="2026-05-22T15:00:38+02:00"/>
      </publicationStmt>
      <sourceDesc>
        <p part="N">HAL API Platform</p>
      </sourceDesc>
    </fileDesc>
  </teiHeader>
  <text>
    <body>
      <listBibl>
        <biblFull>
          <!-- Title of the work and the people attached to it: four author entries (role="aut")
               followed by one editor entry with role="depositor".
               Conventions visible in every person entry below:
               - email type="md5" holds a 32-hex-digit digest instead of an address
                 (presumably an MD5 of the address; confirm), and email type="domain" holds only a domain name;
               - idno type="idhal" may appear twice, once with notation="string" and once with notation="numeric";
               - affiliation/@ref points at the xml:id of an org element in the listOrg under back. -->
          <titleStmt>
            <title xml:lang="en">Yet Another Matcher</title>
            <!-- Author 1: has string and numeric idhal, IDREF and ORCID; affiliated to struct-181. -->
            <author role="aut">
              <persName>
                <forename type="first">Fabien</forename>
                <surname>Duchateau</surname>
              </persName>
              <email type="md5">4fd1487bfb494c92eaf81f11f8323534</email>
              <email type="domain">univ-lyon1.fr</email>
              <idno type="idhal" notation="string">fabien-duchateau</idno>
              <idno type="idhal" notation="numeric">4098</idno>
              <idno type="halauthorid" notation="string">25718-4098</idno>
              <idno type="IDREF">https://www.idref.fr/142567302</idno>
              <idno type="ORCID">https://orcid.org/0000-0001-6803-917X</idno>
              <affiliation ref="#struct-181"/>
            </author>
            <!-- Author 2: only a numeric idhal and a halauthorid; no string idhal, ORCID or IDREF is present. -->
            <author role="aut">
              <persName>
                <forename type="first">Remi</forename>
                <surname>Coletta</surname>
              </persName>
              <email type="md5">21a13d656a64c68cb01c863661fb54bf</email>
              <email type="domain">lirmm.fr</email>
              <idno type="idhal" notation="numeric">932759</idno>
              <idno type="halauthorid" notation="string">672401-932759</idno>
              <affiliation ref="#struct-141072"/>
            </author>
            <!-- Author 3: full identifier set; shares the struct-141072 affiliation with author 2. -->
            <author role="aut">
              <persName>
                <forename type="first">Zohra</forename>
                <surname>Bellahsene</surname>
              </persName>
              <email type="md5">1fa349bad174e06f69dc2df1883595bc</email>
              <email type="domain">lirmm.fr</email>
              <idno type="idhal" notation="string">zohra-bellahsene</idno>
              <idno type="idhal" notation="numeric">169913</idno>
              <idno type="halauthorid" notation="string">15690-169913</idno>
              <idno type="ORCID">https://orcid.org/0000-0003-2031-0519</idno>
              <idno type="IDREF">https://www.idref.fr/07917857X</idno>
              <affiliation ref="#struct-141072"/>
            </author>
            <!-- Author 4: the only entry with a second forename (type="middle"); affiliated to struct-300722. -->
            <author role="aut">
              <persName>
                <forename type="first">Renée</forename>
                <forename type="middle">J.</forename>
                <surname>Miller</surname>
              </persName>
              <email type="md5">76961a99796b071a8061fc461cf7dcd5</email>
              <email type="domain">gmail.com</email>
              <idno type="idhal" notation="numeric">861404</idno>
              <idno type="halauthorid" notation="string">402479-861404</idno>
              <affiliation ref="#struct-300722"/>
            </author>
            <!-- Depositor: same name as author 1 but with different md5 and domain values,
                 and no idno or affiliation children. The forename carries no type attribute here. -->
            <editor role="depositor">
              <persName>
                <forename>Fabien</forename>
                <surname>Duchateau</surname>
              </persName>
              <email type="md5">944bb28c4c920ffa0e24fa01aadcb951</email>
              <email type="domain">lirmm.fr</email>
            </editor>
          </titleStmt>
          <!-- Version information for the deposit: one edition (n="v1", type="current") with its
               life-cycle dates and file links, followed by the contributor statement. -->
          <editionStmt>
            <edition n="v1" type="current">
              <!-- Date-time values below use a space separator and carry no time-zone offset,
                   unlike the date/@when in the teiHeader. -->
              <!-- NOTE(review): whenSubmitted (2010-06-25) is later than whenReleased (2009-06-25)
                   and falls on the same day as whenEndEmbargoed; confirm against the HAL record
                   before relying on these two values for ordering. -->
              <date type="whenSubmitted">2010-06-25 07:00:05</date>
              <date type="whenModified">2025-08-26 15:21:01</date>
              <date type="whenReleased">2009-06-25 17:05:02</date>
              <date type="whenProduced">2009-06-05</date>
              <date type="whenEndEmbargoed">2010-06-25</date>
              <!-- Two file references, both with notBefore equal to the whenEndEmbargoed date:
                   the first targets the generic /document URL, the second a named PDF. -->
              <ref type="file" target="https://hal-lirmm.ccsd.cnrs.fr/lirmm-00399025v1/document">
                <date notBefore="2010-06-25"/>
              </ref>
              <!-- The id value on this ref is the target of the ref/@corresp inside the licence
                   element of the record's publicationStmt. Note it is a plain id attribute, not xml:id. -->
              <ref type="file" subtype="author" n="1" target="https://hal-lirmm.ccsd.cnrs.fr/lirmm-00399025v1/file/CIKM2009_1245_53b101d9.pdf" id="file-399025-1067005">
                <date notBefore="2010-06-25"/>
              </ref>
            </edition>
            <!-- Contributor: same name, md5 and domain values as the depositor editor in the titleStmt. -->
            <respStmt>
              <resp>contributor</resp>
              <name key="114409">
                <persName>
                  <forename>Fabien</forename>
                  <surname>Duchateau</surname>
                </persName>
                <email type="md5">944bb28c4c920ffa0e24fa01aadcb951</email>
                <email type="domain">lirmm.fr</email>
              </name>
            </respStmt>
          </editionStmt>
          <!-- Identifiers and availability of the deposited record (as opposed to the export file,
               which has its own publicationStmt in the teiHeader). -->
          <publicationStmt>
            <distributor>CCSD</distributor>
            <!-- halId is the bare identifier; halUri is the same identifier as a URL;
                 halBibtex is a citation key built from it. -->
            <idno type="halId">lirmm-00399025</idno>
            <idno type="halUri">https://hal-lirmm.ccsd.cnrs.fr/lirmm-00399025</idno>
            <idno type="halBibtex">duchateau:lirmm-00399025</idno>
            <!-- halRefHtml and halRef carry the same text in this record (no markup in the HTML variant). -->
            <idno type="halRefHtml">RR-09016, 2009</idno>
            <idno type="halRef">RR-09016, 2009</idno>
            <availability status="restricted">
              <!-- The empty ref inside the licence points (via corresp) at the file ref with
                   id="file-399025-1067005" in the editionStmt, tying the licence to that file. -->
              <licence target="https://about.hal.science/hal-authorisation-v1/">HAL Authorization<ref corresp="#file-399025-1067005"/></licence>
            </availability>
          </publicationStmt>
          <!-- Collection stamps attached to the record. Each idno type="stamp" has a short code in
               @n and a display label as text. Where @corresp is present it names the @n code of
               another stamp in this list (ZENITH to LIRMM, UM-2015-2021 to UNIV-MONTPELLIER);
               presumably a parent collection (confirm). -->
          <!-- NOTE(review): INRIA_TEST and TESTALAIN1 look like test stamps; confirm whether
               consumers should filter them out. -->
          <seriesStmt>
            <idno type="stamp" n="CNRS">CNRS - Centre national de la recherche scientifique</idno>
            <idno type="stamp" n="INRIA">INRIA - Institut National de Recherche en Informatique et en Automatique</idno>
            <idno type="stamp" n="INRIA-SOPHIA">INRIA Sophia Antipolis - Méditerranée</idno>
            <idno type="stamp" n="INRIASO">INRIA-SOPHIA</idno>
            <idno type="stamp" n="INRIA_TEST">INRIA - Institut National de Recherche en Informatique et en Automatique</idno>
            <idno type="stamp" n="INRIA34">Antenne Inria de l'université de Montpellier</idno>
            <idno type="stamp" n="TESTALAIN1">TESTALAIN1</idno>
            <idno type="stamp" n="ZENITH" corresp="LIRMM">Scientific Data Management</idno>
            <idno type="stamp" n="LIRMM">Laboratoire d'Informatique de Robotique et de Microélectronique de Montpellier</idno>
            <idno type="stamp" n="INRIA2">INRIA 2</idno>
            <idno type="stamp" n="LARA">LARA</idno>
            <idno type="stamp" n="MIPS">Mathématiques, Informatique, Physique et Systèmes</idno>
            <idno type="stamp" n="LABEXIMU">Laboratoire d’Excellence Intelligences des Mondes Urbains</idno>
            <idno type="stamp" n="UNIV-MONTPELLIER">Université de Montpellier</idno>
            <idno type="stamp" n="UNIV-COTEDAZUR">Université Côte d'Azur</idno>
            <idno type="stamp" n="UM-2015-2021" corresp="UNIV-MONTPELLIER">Université de Montpellier (2015-2021)</idno>
            <idno type="stamp" n="INRIA-CANADA">INRIA-CANADA</idno>
          </seriesStmt>
          <!-- Free-standing notes about the record. Only an audience note is present:
               code n="1" with the label "Not set". -->
          <notesStmt>
            <note type="audience" n="1">Not set</note>
          </notesStmt>
          <!-- Structured bibliographic description of the work.
               analytic repeats the title and the same four author entries as the titleStmt
               (the depositor editor is not repeated); monogr carries the report number and the
               publication date. -->
          <sourceDesc>
            <biblStruct>
              <analytic>
                <title xml:lang="en">Yet Another Matcher</title>
                <!-- Author entries: email type="md5" is a 32-hex-digit digest, email type="domain" a bare
                     domain, and affiliation/@ref points at an org xml:id in the listOrg under back. -->
                <author role="aut">
                  <persName>
                    <forename type="first">Fabien</forename>
                    <surname>Duchateau</surname>
                  </persName>
                  <email type="md5">4fd1487bfb494c92eaf81f11f8323534</email>
                  <email type="domain">univ-lyon1.fr</email>
                  <idno type="idhal" notation="string">fabien-duchateau</idno>
                  <idno type="idhal" notation="numeric">4098</idno>
                  <idno type="halauthorid" notation="string">25718-4098</idno>
                  <idno type="IDREF">https://www.idref.fr/142567302</idno>
                  <idno type="ORCID">https://orcid.org/0000-0001-6803-917X</idno>
                  <affiliation ref="#struct-181"/>
                </author>
                <author role="aut">
                  <persName>
                    <forename type="first">Remi</forename>
                    <surname>Coletta</surname>
                  </persName>
                  <email type="md5">21a13d656a64c68cb01c863661fb54bf</email>
                  <email type="domain">lirmm.fr</email>
                  <idno type="idhal" notation="numeric">932759</idno>
                  <idno type="halauthorid" notation="string">672401-932759</idno>
                  <affiliation ref="#struct-141072"/>
                </author>
                <author role="aut">
                  <persName>
                    <forename type="first">Zohra</forename>
                    <surname>Bellahsene</surname>
                  </persName>
                  <email type="md5">1fa349bad174e06f69dc2df1883595bc</email>
                  <email type="domain">lirmm.fr</email>
                  <idno type="idhal" notation="string">zohra-bellahsene</idno>
                  <idno type="idhal" notation="numeric">169913</idno>
                  <idno type="halauthorid" notation="string">15690-169913</idno>
                  <idno type="ORCID">https://orcid.org/0000-0003-2031-0519</idno>
                  <idno type="IDREF">https://www.idref.fr/07917857X</idno>
                  <affiliation ref="#struct-141072"/>
                </author>
                <author role="aut">
                  <persName>
                    <forename type="first">Renée</forename>
                    <forename type="middle">J.</forename>
                    <surname>Miller</surname>
                  </persName>
                  <email type="md5">76961a99796b071a8061fc461cf7dcd5</email>
                  <email type="domain">gmail.com</email>
                  <idno type="idhal" notation="numeric">861404</idno>
                  <idno type="halauthorid" notation="string">402479-861404</idno>
                  <affiliation ref="#struct-300722"/>
                </author>
              </analytic>
              <monogr>
                <!-- The report number matches the text of the halRef idno in the publicationStmt ("RR-09016, 2009"). -->
                <idno type="reportNumber">RR-09016</idno>
                <imprint>
                  <!-- Same day as the whenProduced date in the editionStmt. -->
                  <date type="datePub">2009-06-05</date>
                </imprint>
              </monogr>
            </biblStruct>
          </sourceDesc>
          <!-- Descriptive profile of the work: language, author keywords, classification codes and abstract. -->
          <profileDesc>
            <langUsage>
              <language ident="en">English</language>
            </langUsage>
            <textClass>
              <!-- scheme="author" marks these as keywords supplied with the deposit; each term is tagged xml:lang="en". -->
              <keywords scheme="author">
                <term xml:lang="en">schema matching</term>
                <term xml:lang="en">data integration</term>
                <term xml:lang="en">matcher factory</term>
                <term xml:lang="en">machine learning</term>
                <term xml:lang="en">XML schemas</term>
              </keywords>
              <!-- classCode/@scheme selects the vocabulary, @n is the code and the text is its label.
                   Two halDomain entries are present; the three typology schemes all carry the code REPORT. -->
              <classCode scheme="halDomain" n="info.info-db">Computer Science [cs]/Databases [cs.DB]</classCode>
              <classCode scheme="halDomain" n="info.info-lg">Computer Science [cs]/Machine Learning [cs.LG]</classCode>
              <classCode scheme="halTypology" n="REPORT">Reports</classCode>
              <classCode scheme="halOldTypology" n="REPORT">Reports</classCode>
              <classCode scheme="halTreeTypology" n="REPORT">Reports</classCode>
            </textClass>
            <!-- Abstract text is kept on a single line inside p so no indentation whitespace leaks into the content. -->
            <abstract xml:lang="en">
              <p>Discovering correspondences between schema elements is a crucial task for data integration. Most matching tools are semi-automatic, e.g. an expert must tune some parameters (thresholds, weights, etc.). They mainly use several methods to combine and aggregate similarity measures. However, their quality results often decrease when one requires to integrate a new similarity measure or when matching particular domain schemas. This paper describes YAM (Yet Another Matcher), which is a matcher factory. Indeed, it enables the generation of a dedicated matcher for a given schema matching scenario, according to user inputs. Our approach is based on machine learning since schema matchers can be seen as classifiers. Several bunches of experiments run against matchers generated by YAM and traditional matching tools show how our approach (i) is able to generate the best matcher for a given scenario and (ii) easily integrates user preferences, namely recall and precision tradeoff.</p>
            </abstract>
          </profileDesc>
        </biblFull>
      </listBibl>
    </body>
    <back>
      <listOrg type="structures">
        <!-- LIRMM laboratory entry, referenced by affiliation ref="#struct-181" on the first author.
             status="OLD" together with an end date of 2021-12-31 marks this entry as closed. -->
        <org type="laboratory" xml:id="struct-181" status="OLD">
          <!-- External identifiers; only the ROR value is given as a full URL, the others are bare codes. -->
          <idno type="IdRef">139590827</idno>
          <idno type="ISNI">0000000405990488</idno>
          <idno type="RNSR">199111950H</idno>
          <idno type="ROR">https://ror.org/013yean28</idno>
          <orgName>Laboratoire d'Informatique de Robotique et de Microélectronique de Montpellier</orgName>
          <orgName type="acronym">LIRMM</orgName>
          <date type="start">1995-01-01</date>
          <date type="end">2021-12-31</date>
          <desc>
            <address>
              <addrLine>161 rue Ada - 34095 Montpellier</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">https://www.lirmm.fr</ref>
          </desc>
          <!-- Each relation/@active points at another org xml:id in this listOrg
               (struct-410122 and struct-441569); both carry the name UMR5506 and type="direct". -->
          <listRelation>
            <relation name="UMR5506" active="#struct-410122" type="direct"/>
            <relation name="UMR5506" active="#struct-441569" type="direct"/>
          </listRelation>
        </org>
        <!-- ZENITH research team entry, referenced by affiliation ref="#struct-141072" on the second
             and third authors. status="OLD" with an end date and no start date. -->
        <org type="researchteam" xml:id="struct-141072" status="OLD">
          <idno type="RNSR">201121208J</idno>
          <orgName>Scientific Data Management</orgName>
          <orgName type="acronym">ZENITH</orgName>
          <date type="end">2021-12-31</date>
          <desc>
            <address>
              <addrLine>LIRMM, 161 rue Ada, 34000 Montpellier</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">https://team.inria.fr/zenith/</ref>
          </desc>
          <!-- Five relations to other org entries in this listOrg: two direct
               (struct-181, struct-34586) and three indirect (struct-410122, struct-441569,
               struct-300009). Each indirect target is also a direct relation of one of the two
               direct targets. Only the two UMR5506 relations carry a name attribute. -->
          <listRelation>
            <relation active="#struct-181" type="direct"/>
            <relation name="UMR5506" active="#struct-410122" type="indirect"/>
            <relation name="UMR5506" active="#struct-441569" type="indirect"/>
            <relation active="#struct-34586" type="direct"/>
            <relation active="#struct-300009" type="indirect"/>
          </listRelation>
        </org>
        <!-- University of Toronto entry, referenced by affiliation ref="#struct-300722" on the fourth
             author. status="VALID", no end date and no listRelation children. -->
        <org type="regroupinstitution" xml:id="struct-300722" status="VALID">
          <idno type="ROR">https://ror.org/03dbr7087</idno>
          <orgName>University of Toronto</orgName>
          <date type="start">1827-01-01</date>
          <desc>
            <address>
              <addrLine>27 King's College Circle, Toronto M5S 1A1</addrLine>
              <country key="CA"/>
            </address>
            <ref type="url">http://www.utoronto.ca/</ref>
          </desc>
        </org>
        <!-- Université de Montpellier entry. Not referenced by any author directly; it is the target of
             relation active="#struct-410122" on struct-181 (direct) and struct-141072 (indirect).
             status="OLD" with an end date of 2021-12-31 and no start date. -->
        <org type="institution" xml:id="struct-410122" status="OLD">
          <idno type="ISNI">0000000120970141</idno>
          <idno type="ROR">https://ror.org/051escj72</idno>
          <orgName>Université de Montpellier</orgName>
          <orgName type="acronym">UM</orgName>
          <date type="end">2021-12-31</date>
          <desc>
            <address>
              <addrLine>163 rue Auguste Broussonnet - 34090 Montpellier</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">http://www.umontpellier.fr/</ref>
          </desc>
        </org>
        <!-- CNRS entry. Target of relation active="#struct-441569" on struct-181 (direct) and
             struct-141072 (indirect). status="VALID" with a start date and no end date. -->
        <org type="regroupinstitution" xml:id="struct-441569" status="VALID">
          <idno type="IdRef">02636817X</idno>
          <idno type="ISNI">0000000122597504</idno>
          <idno type="ROR">https://ror.org/02feahw73</idno>
          <orgName>Centre National de la Recherche Scientifique</orgName>
          <orgName type="acronym">CNRS</orgName>
          <date type="start">1939-10-19</date>
          <desc>
            <!-- The address holds only a country; there is no addrLine for this entry. -->
            <address>
              <country key="FR"/>
            </address>
            <ref type="url">https://www.cnrs.fr/</ref>
          </desc>
        </org>
        <!-- Inria centre entry (Sophia Antipolis address). Target of the direct relation
             active="#struct-34586" on struct-141072. status="VALID"; no acronym and no dates are given. -->
        <org type="laboratory" xml:id="struct-34586" status="VALID">
          <idno type="RNSR">198318250R</idno>
          <idno type="ROR">https://ror.org/01nzkaw91</idno>
          <orgName>Centre Inria d'Université Côte d'Azur</orgName>
          <desc>
            <address>
              <addrLine>2004 route des Lucioles BP 93 06902 Sophia Antipolis</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">http://www.inria.fr/centre/sophia/</ref>
          </desc>
          <!-- Single direct relation to struct-300009, the Inria institution entry in this listOrg. -->
          <listRelation>
            <relation active="#struct-300009" type="direct"/>
          </listRelation>
        </org>
        <!-- Inria institution entry. Target of relation active="#struct-300009" on struct-34586 (direct)
             and struct-141072 (indirect). status="VALID"; no dates and no listRelation children. -->
        <org type="institution" xml:id="struct-300009" status="VALID">
          <idno type="ROR">https://ror.org/02kvxyf05</idno>
          <orgName>Institut National de Recherche en Informatique et en Automatique</orgName>
          <orgName type="acronym">Inria</orgName>
          <desc>
            <address>
              <!-- Separators restored: the previous value ran the address parts together
                   ("VoluceauRocquencourt", "BP 10578153"), fusing the locality with the street name
                   and the PO box number with the postal code. -->
              <addrLine>Domaine de Voluceau, Rocquencourt - BP 105, 78153 Le Chesnay Cedex</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">http://www.inria.fr/en/</ref>
          </desc>
        </org>
      </listOrg>
    </back>
  </text>
</TEI>