<?xml version="1.0" encoding="utf-8"?>
<TEI xmlns="http://www.tei-c.org/ns/1.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:hal="http://hal.archives-ouvertes.fr/" xmlns:gml="http://www.opengis.net/gml/3.3/" xmlns:gmlce="http://www.opengis.net/gml/3.3/ce" version="1.1" xsi:schemaLocation="http://www.tei-c.org/ns/1.0 http://api.archives-ouvertes.fr/documents/aofr-sword.xsd">
  <teiHeader>
    <fileDesc>
      <titleStmt>
        <title>HAL TEI export of lirmm-00816292</title>
      </titleStmt>
      <publicationStmt>
        <distributor>CCSD</distributor>
        <availability status="restricted">
          <licence target="https://creativecommons.org/publicdomain/zero/1.0/">CC0 1.0 - Universal</licence>
        </availability>
        <date when="2026-05-24T01:27:50+02:00"/>
      </publicationStmt>
      <sourceDesc>
        <p part="N">HAL API Platform</p>
      </sourceDesc>
    </fileDesc>
  </teiHeader>
  <text>
    <body>
      <listBibl>
        <biblFull>
          <titleStmt>
            <title xml:lang="en">Toward Geographic Information Harvesting: Extraction of Spatial Relational Facts from Web Documents</title>
            <title xml:lang="fr">Vers la récolte d'information géographique : extraction de relations spatiales à partir de documents Web</title>
            <author role="aut">
              <persName>
                <forename type="first">Corrado</forename>
                <surname>Loglisci</surname>
              </persName>
              <idno type="halauthorid">653526-0</idno>
              <affiliation ref="#struct-300766"/>
              <affiliation ref="#struct-568971"/>
            </author>
            <author role="aut">
              <persName>
                <forename type="first">Dino</forename>
                <surname>Ienco</surname>
              </persName>
              <email type="md5">b326eb4334c6ba52cdd2279add798afc</email>
              <email type="domain">inrae.fr</email>
              <idno type="idhal" notation="string">dino-ienco</idno>
              <idno type="idhal" notation="numeric">6226</idno>
              <idno type="halauthorid" notation="string">23855-6226</idno>
              <idno type="ORCID">https://orcid.org/0000-0002-8736-3132</idno>
              <idno type="IDREF">https://www.idref.fr/172688183</idno>
              <idno type="GOOGLE SCHOLAR">https://scholar.google.fr/citations?user=C8zfH3kAAAAJ</idno>
              <affiliation ref="#struct-568971"/>
              <affiliation ref="#struct-388310"/>
            </author>
            <author role="aut">
              <persName>
                <forename type="first">Mathieu</forename>
                <surname>Roche</surname>
              </persName>
              <email type="md5">f3369d939820713d626eff81740a4eeb</email>
              <email type="domain">cirad.fr</email>
              <idno type="idhal" notation="string">mathieu-roche</idno>
              <idno type="idhal" notation="numeric">4967</idno>
              <idno type="halauthorid" notation="string">20190-4967</idno>
              <idno type="IDREF">https://www.idref.fr/09042087X</idno>
              <idno type="ORCID">https://orcid.org/0000-0003-3272-8568</idno>
              <affiliation ref="#struct-568971"/>
            </author>
            <author role="aut">
              <persName>
                <forename type="first">Maguelonne</forename>
                <surname>Teisseire</surname>
              </persName>
              <email type="md5">bfed7f55123bad5a6ddc404f64f1a920</email>
              <email type="domain">teledetection.fr</email>
              <idno type="idhal" notation="string">maguelonne-teisseire</idno>
              <idno type="idhal" notation="numeric">8645</idno>
              <idno type="halauthorid" notation="string">24802-8645</idno>
              <idno type="ORCID">https://orcid.org/0000-0001-9313-6414</idno>
              <idno type="IDREF">https://www.idref.fr/117436593</idno>
              <idno type="VIAF">https://viaf.org/viaf/164498326</idno>
              <idno type="ISNI">http://isni.org/isni/0000000117179295</idno>
              <affiliation ref="#struct-388310"/>
              <affiliation ref="#struct-568971"/>
            </author>
            <author role="aut">
              <persName>
                <forename type="first">Donato</forename>
                <surname>Malerba</surname>
              </persName>
              <idno type="halauthorid">196402-0</idno>
              <affiliation ref="#struct-300766"/>
            </author>
            <editor role="depositor">
              <persName>
                <forename>Mathieu</forename>
                <surname>Roche</surname>
              </persName>
              <email type="md5">db65d8027137d174ecf559fb797288b9</email>
              <email type="domain">cirad.fr</email>
            </editor>
          </titleStmt>
          <editionStmt>
            <edition n="v1" type="current">
              <date type="whenSubmitted">2013-04-21 13:56:11</date>
              <date type="whenModified">2025-03-21 15:14:31</date>
              <date type="whenReleased">2013-05-15 17:30:15</date>
              <date type="whenProduced">2012-12-10</date>
              <fs>
                <f name="inra_publicVise_local" notation="string" n="SC">
                  <string>inra_publicVise_local_SC</string>
                </f>
              </fs>
            </edition>
            <respStmt>
              <resp>contributor</resp>
              <name key="114352">
                <persName>
                  <forename>Mathieu</forename>
                  <surname>Roche</surname>
                </persName>
                <email type="md5">db65d8027137d174ecf559fb797288b9</email>
                <email type="domain">cirad.fr</email>
              </name>
            </respStmt>
          </editionStmt>
          <publicationStmt>
            <distributor>CCSD</distributor>
            <idno type="halId">lirmm-00816292</idno>
            <idno type="halUri">https://hal-lirmm.ccsd.cnrs.fr/lirmm-00816292</idno>
            <idno type="halBibtex">loglisci:lirmm-00816292</idno>
            <idno type="halRefHtml">&lt;i&gt;12th International Workshop on Spatial and Spatiotemporal Data Mining (SSTDM) @ ICDM&lt;/i&gt;, Dec 2012, Brussels, Belgium. pp.789-796, &lt;a target="_blank" href="https://dx.doi.org/10.1109/ICDMW.2012.20"&gt;&amp;#x27E8;10.1109/ICDMW.2012.20&amp;#x27E9;&lt;/a&gt;</idno>
            <idno type="halRef">12th International Workshop on Spatial and Spatiotemporal Data Mining (SSTDM) @ ICDM, Dec 2012, Brussels, Belgium. pp.789-796, &#x27E8;10.1109/ICDMW.2012.20&#x27E9;</idno>
            <availability status="restricted"/>
          </publicationStmt>
          <seriesStmt>
            <idno type="stamp" n="CIRAD">CIRAD - Centre de coopération internationale en recherche agronomique pour le développement</idno>
            <idno type="stamp" n="AGROPARISTECH">AgroParisTech</idno>
            <idno type="stamp" n="CNRS">CNRS - Centre national de la recherche scientifique</idno>
            <idno type="stamp" n="IRSTEA">IRSTEA - Institut national de recherche en sciences et technologies pour l'environnement et l'agriculture (&lt;b&gt;anciennement Cemagref&lt;/b&gt;)</idno>
            <idno type="stamp" n="LIRMM">Laboratoire d'Informatique de Robotique et de Microélectronique de Montpellier</idno>
            <idno type="stamp" n="AGROPOLIS">Agropolis</idno>
            <idno type="stamp" n="TETIS">TETIS</idno>
            <idno type="stamp" n="AGREENIUM">Archive ouverte en agrobiosciences</idno>
            <idno type="stamp" n="MIPS">Mathématiques, Informatique, Physique et Systèmes</idno>
            <idno type="stamp" n="UNIV-MONTPELLIER">Université de Montpellier</idno>
            <idno type="stamp" n="INRAE">Institut National de Recherche en Agriculture, Alimentation et Environnement</idno>
            <idno type="stamp" n="INRAEOCCITANIEMONTPELLIER" corresp="INRAE">INRAE Occitanie Montpellier</idno>
            <idno type="stamp" n="UM-2015-2021" corresp="UNIV-MONTPELLIER">Université de Montpellier (2015-2021)</idno>
            <idno type="stamp" n="MATHNUM">Département MathNum</idno>
            <idno type="stamp" n="TEST-MATHNUM">Test MathNum</idno>
          </seriesStmt>
          <notesStmt>
            <note type="commentary">[Departement_IRSTEA]Territoires [TR1_IRSTEA]SYNERGIE&lt;br/&gt;International Workshop on Spatial and Spatiotemporal Data Mining (SSTDM-12), In Cooperation with IEEE ICDM 2012, 10 December 2012, Brussels, Belgium</note>
            <note type="audience" n="2">International</note>
            <note type="invited" n="0">No</note>
            <note type="popular" n="0">No</note>
            <note type="peer" n="1">Yes</note>
            <note type="proceedings" n="1">Yes</note>
          </notesStmt>
          <sourceDesc>
            <biblStruct>
              <analytic>
                <title xml:lang="en">Toward Geographic Information Harvesting: Extraction of Spatial Relational Facts from Web Documents</title>
                <title xml:lang="fr">Vers la récolte d'information géographique : extraction de relations spatiales à partir de documents Web</title>
                <author role="aut">
                  <persName>
                    <forename type="first">Corrado</forename>
                    <surname>Loglisci</surname>
                  </persName>
                  <idno type="halauthorid">653526-0</idno>
                  <affiliation ref="#struct-300766"/>
                  <affiliation ref="#struct-568971"/>
                </author>
                <author role="aut">
                  <persName>
                    <forename type="first">Dino</forename>
                    <surname>Ienco</surname>
                  </persName>
                  <email type="md5">b326eb4334c6ba52cdd2279add798afc</email>
                  <email type="domain">inrae.fr</email>
                  <idno type="idhal" notation="string">dino-ienco</idno>
                  <idno type="idhal" notation="numeric">6226</idno>
                  <idno type="halauthorid" notation="string">23855-6226</idno>
                  <idno type="ORCID">https://orcid.org/0000-0002-8736-3132</idno>
                  <idno type="IDREF">https://www.idref.fr/172688183</idno>
                  <idno type="GOOGLE SCHOLAR">https://scholar.google.fr/citations?user=C8zfH3kAAAAJ</idno>
                  <affiliation ref="#struct-568971"/>
                  <affiliation ref="#struct-388310"/>
                </author>
                <author role="aut">
                  <persName>
                    <forename type="first">Mathieu</forename>
                    <surname>Roche</surname>
                  </persName>
                  <email type="md5">f3369d939820713d626eff81740a4eeb</email>
                  <email type="domain">cirad.fr</email>
                  <idno type="idhal" notation="string">mathieu-roche</idno>
                  <idno type="idhal" notation="numeric">4967</idno>
                  <idno type="halauthorid" notation="string">20190-4967</idno>
                  <idno type="IDREF">https://www.idref.fr/09042087X</idno>
                  <idno type="ORCID">https://orcid.org/0000-0003-3272-8568</idno>
                  <affiliation ref="#struct-568971"/>
                </author>
                <author role="aut">
                  <persName>
                    <forename type="first">Maguelonne</forename>
                    <surname>Teisseire</surname>
                  </persName>
                  <email type="md5">bfed7f55123bad5a6ddc404f64f1a920</email>
                  <email type="domain">teledetection.fr</email>
                  <idno type="idhal" notation="string">maguelonne-teisseire</idno>
                  <idno type="idhal" notation="numeric">8645</idno>
                  <idno type="halauthorid" notation="string">24802-8645</idno>
                  <idno type="ORCID">https://orcid.org/0000-0001-9313-6414</idno>
                  <idno type="IDREF">https://www.idref.fr/117436593</idno>
                  <idno type="VIAF">https://viaf.org/viaf/164498326</idno>
                  <idno type="ISNI">http://isni.org/isni/0000000117179295</idno>
                  <affiliation ref="#struct-388310"/>
                  <affiliation ref="#struct-568971"/>
                </author>
                <author role="aut">
                  <persName>
                    <forename type="first">Donato</forename>
                    <surname>Malerba</surname>
                  </persName>
                  <idno type="halauthorid">196402-0</idno>
                  <affiliation ref="#struct-300766"/>
                </author>
              </analytic>
              <monogr>
                <idno type="isbn">978-076954925-5</idno>
                <meeting>
                  <title>12th International Workshop on Spatial and Spatiotemporal Data Mining (SSTDM) @ ICDM</title>
                  <date type="start">2012-12-10</date>
                  <settlement>Brussels</settlement>
                  <country key="BE">Belgium</country>
                </meeting>
                <imprint>
                  <biblScope unit="pp">789-796</biblScope>
                  <date type="datePub">2012</date>
                </imprint>
              </monogr>
              <idno type="doi">10.1109/ICDMW.2012.20</idno>
              <idno type="irstea">PUB00037620</idno>
            </biblStruct>
          </sourceDesc>
          <profileDesc>
            <langUsage>
              <language ident="en">English</language>
            </langUsage>
            <textClass>
              <classCode scheme="halDomain" n="info.info-db">Computer Science [cs]/Databases [cs.DB]</classCode>
              <classCode scheme="halDomain" n="info.info-ir">Computer Science [cs]/Information Retrieval [cs.IR]</classCode>
              <classCode scheme="halDomain" n="info.info-wb">Computer Science [cs]/Web</classCode>
              <classCode scheme="vocinrae-old" n="INFORMATION GEOGRAPHIQUE">INFORMATION GEOGRAPHIQUE</classCode>
              <classCode scheme="vocinrae-old" n="WEB">WEB</classCode>
              <classCode scheme="vocinrae-old" n="SYSTEME D'INFORMATION A REFERENCE SPATIALE">SYSTEME D'INFORMATION A REFERENCE SPATIALE</classCode>
              <classCode scheme="vocinrae-old" n="SYSTEME D'INFORMATION GEOGRAPHIQUE">SYSTEME D'INFORMATION GEOGRAPHIQUE</classCode>
              <classCode scheme="vocinrae-old" n="GEOGRAPHIC INFORMATION">GEOGRAPHIC INFORMATION</classCode>
              <classCode scheme="vocinrae-old" n="WORLD WIDE WEB">WORLD WIDE WEB</classCode>
              <classCode scheme="vocinrae-old" n="GEOGRAPHICAL INFORMATION SYSTEMS">GEOGRAPHICAL INFORMATION SYSTEMS</classCode>
              <classCode scheme="halTypology" n="COMM">Conference papers</classCode>
              <classCode scheme="halOldTypology" n="COMM">Conference papers</classCode>
              <classCode scheme="halTreeTypology" n="COMM">Conference papers</classCode>
            </textClass>
            <abstract xml:lang="en">
              <p>This paper faces the problem of harvesting geographic information from Web documents, specifically, extracting facts on spatial relations among geographic places. The motivation is twofold. First, researchers on Spatial Data Mining often assume that spatial data are already available, thanks to current GIS and positioning technologies. Nevertheless, this is not applicable to the case of spatial information embedded in data without an explicit spatial modeling, such as documents. Second, despite the huge amount of Web documents conveying useful geographic information, there is not much work on how to harvest spatial data from these documents. The problem is particularly challenging because of the lack of annotated documents, which prevents the application of supervised learning techniques. In this paper, we propose to harvest facts on geographic places through an unsupervised approach which recognizes spatial relations among geographic places without supposing the availability of annotated documents. The proposed approach is based on the combined use of a spatial ontology and a prototype-based classifier. A case study on topological and directional relations is reported and commented.</p>
            </abstract>
          </profileDesc>
        </biblFull>
      </listBibl>
    </body>
    <back>
      <listOrg type="structures">
        <org type="institution" xml:id="struct-300766" status="VALID">
          <idno type="ROR">https://ror.org/027ynra39</idno>
          <orgName>Università degli studi di Bari Aldo Moro = University of Bari Aldo Moro</orgName>
          <orgName type="acronym">UNIBA</orgName>
          <desc>
            <address>
              <addrLine>Piazza Umberto I - 70121 Bari</addrLine>
              <country key="IT"/>
            </address>
            <ref type="url">http://www.uniba.it/</ref>
          </desc>
        </org>
        <org type="laboratory" xml:id="struct-568971" status="OLD">
          <orgName>Territoires, Environnement, Télédétection et Information Spatiale</orgName>
          <orgName type="acronym">UMR TETIS</orgName>
          <date type="start">2012-01-01</date>
          <date type="end">2015-12-31</date>
          <desc>
            <address>
              <addrLine>Maison de la télédétection - 500 rue Jean-François Breton - 34093 Montpellier Cedex 5</addrLine>
              <country key="FR"/>
            </address>
          </desc>
          <listRelation>
            <relation active="#struct-11574" type="direct"/>
            <relation active="#struct-148117" type="direct"/>
            <relation name="UMR1470" active="#struct-302049" type="direct"/>
          </listRelation>
        </org>
        <org type="researchteam" xml:id="struct-388310" status="OLD">
          <orgName>Fouille de données environnementales</orgName>
          <orgName type="acronym">TATOO</orgName>
          <date type="end">2013</date>
          <desc>
            <address>
              <country key="FR"/>
            </address>
          </desc>
          <listRelation>
            <relation active="#struct-181" type="direct"/>
            <relation name="UMR5506" active="#struct-410122" type="indirect"/>
            <relation name="UMR5506" active="#struct-441569" type="indirect"/>
          </listRelation>
        </org>
        <org type="institution" xml:id="struct-11574" status="VALID">
          <idno type="ISNI">0000000121539871</idno>
          <idno type="ROR">https://ror.org/05kpkpg04</idno>
          <orgName>Centre de Coopération Internationale en Recherche Agronomique pour le Développement</orgName>
          <orgName type="acronym">Cirad</orgName>
          <date type="start">1984-06-01</date>
          <desc>
            <address>
              <addrLine>Siège 42, rue Scheffer 75116 Paris</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">http://www.cirad.fr</ref>
          </desc>
        </org>
        <org type="institution" xml:id="struct-148117" status="VALID">
          <idno type="IdRef">139408088</idno>
          <idno type="ROR">https://ror.org/02kbmgc12</idno>
          <orgName>AgroParisTech</orgName>
          <date type="start">2007-01-01</date>
          <desc>
            <address>
              <addrLine>22 place de l'Agronomie CS 20040 91123 Palaiseau cedex</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">https://www.agroparistech.fr/</ref>
          </desc>
        </org>
        <org type="institution" xml:id="struct-302049" status="OLD">
          <idno type="ROR">https://ror.org/01wep6g48</idno>
          <orgName>Institut national de recherche en sciences et technologies pour l'environnement et l'agriculture</orgName>
          <orgName type="acronym">IRSTEA</orgName>
          <date type="start">2012-01-01</date>
          <date type="end">2019-12-31</date>
          <desc>
            <address>
              <country key="FR"/>
            </address>
            <ref type="url">http://www.irstea.fr</ref>
          </desc>
        </org>
        <org type="laboratory" xml:id="struct-181" status="OLD">
          <idno type="IdRef">139590827</idno>
          <idno type="ISNI">0000000405990488</idno>
          <idno type="RNSR">199111950H</idno>
          <idno type="ROR">https://ror.org/013yean28</idno>
          <orgName>Laboratoire d'Informatique de Robotique et de Microélectronique de Montpellier</orgName>
          <orgName type="acronym">LIRMM</orgName>
          <date type="start">1995-01-01</date>
          <date type="end">2021-12-31</date>
          <desc>
            <address>
              <addrLine>161 rue Ada - 34095 Montpellier</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">https://www.lirmm.fr</ref>
          </desc>
          <listRelation>
            <relation name="UMR5506" active="#struct-410122" type="direct"/>
            <relation name="UMR5506" active="#struct-441569" type="direct"/>
          </listRelation>
        </org>
        <org type="institution" xml:id="struct-410122" status="OLD">
          <idno type="ISNI">0000000120970141</idno>
          <idno type="ROR">https://ror.org/051escj72</idno>
          <orgName>Université de Montpellier</orgName>
          <orgName type="acronym">UM</orgName>
          <date type="end">2021-12-31</date>
          <desc>
            <address>
              <addrLine>163 rue Auguste Broussonnet - 34090 Montpellier</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">http://www.umontpellier.fr/</ref>
          </desc>
        </org>
        <org type="regroupinstitution" xml:id="struct-441569" status="VALID">
          <idno type="IdRef">02636817X</idno>
          <idno type="ISNI">0000000122597504</idno>
          <idno type="ROR">https://ror.org/02feahw73</idno>
          <orgName>Centre National de la Recherche Scientifique</orgName>
          <orgName type="acronym">CNRS</orgName>
          <date type="start">1939-10-19</date>
          <desc>
            <address>
              <country key="FR"/>
            </address>
            <ref type="url">https://www.cnrs.fr/</ref>
          </desc>
        </org>
      </listOrg>
    </back>
  </text>
</TEI>