<?xml version="1.0" encoding="utf-8"?>
<TEI xmlns="http://www.tei-c.org/ns/1.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:hal="http://hal.archives-ouvertes.fr/" xmlns:gml="http://www.opengis.net/gml/3.3/" xmlns:gmlce="http://www.opengis.net/gml/3.3/ce" version="1.1" xsi:schemaLocation="http://www.tei-c.org/ns/1.0 http://api.archives-ouvertes.fr/documents/aofr-sword.xsd">
  <teiHeader>
    <fileDesc>
      <titleStmt>
        <title>HAL TEI export of lirmm-01169603</title>
      </titleStmt>
      <publicationStmt>
        <distributor>CCSD</distributor>
        <availability status="restricted">
          <licence target="https://creativecommons.org/publicdomain/zero/1.0/">CC0 1.0 - Universal</licence>
        </availability>
        <date when="2026-05-04T00:13:49+02:00"/>
      </publicationStmt>
      <sourceDesc>
        <p part="N">HAL API Platform</p>
      </sourceDesc>
    </fileDesc>
  </teiHeader>
  <text>
    <body>
      <listBibl>
        <biblFull>
          <titleStmt>
            <title xml:lang="en">Data Partitioning for Fast Mining of Frequent Itemsets in Massively Distributed Environments</title>
            <author role="aut">
              <persName>
                <forename type="first">Saber</forename>
                <surname>Salah</surname>
              </persName>
              <email type="md5">39374a361f2222408fe6dcb39e325a43</email>
              <email type="domain">inria.fr</email>
              <idno type="idhal" notation="numeric">967928</idno>
              <idno type="halauthorid" notation="string">922189-967928</idno>
              <affiliation ref="#struct-141072"/>
            </author>
            <author role="aut">
              <persName>
                <forename type="first">Reza</forename>
                <surname>Akbarinia</surname>
              </persName>
              <email type="md5">521e1deee4724b1d0699efe11300ed33</email>
              <email type="domain">inria.fr</email>
              <idno type="idhal" notation="string">reza-akbarinia</idno>
              <idno type="idhal" notation="numeric">172647</idno>
              <idno type="halauthorid" notation="string">8354-172647</idno>
              <idno type="ORCID">https://orcid.org/0000-0002-7098-0361</idno>
              <idno type="IDREF">https://www.idref.fr/119863421</idno>
              <orgName ref="#struct-300009"/>
              <affiliation ref="#struct-141072"/>
            </author>
            <author role="aut">
              <persName>
                <forename type="first">Florent</forename>
                <surname>Masseglia</surname>
              </persName>
              <email type="md5">57004dd61ce7344cbd00f2bd70fc6ec2</email>
              <email type="domain">inria.fr</email>
              <idno type="idhal" notation="string">florent-masseglia</idno>
              <idno type="idhal" notation="numeric">172896</idno>
              <idno type="halauthorid" notation="string">17272-172896</idno>
              <idno type="ORCID">https://orcid.org/0000-0002-1149-585X</idno>
              <idno type="IDREF">https://www.idref.fr/120528681</idno>
              <orgName ref="#struct-300009"/>
              <affiliation ref="#struct-141072"/>
            </author>
            <editor role="depositor">
              <persName>
                <forename>Florent</forename>
                <surname>Masseglia</surname>
              </persName>
              <email type="md5">2ebfe57879432a8eb507eec9cbc06284</email>
              <email type="domain">sophia.inria.fr</email>
            </editor>
          </titleStmt>
          <editionStmt>
            <edition n="v1" type="current">
              <date type="whenSubmitted">2015-06-29 18:29:28</date>
              <date type="whenModified">2025-08-26 15:21:01</date>
              <date type="whenReleased">2015-07-03 09:53:48</date>
              <date type="whenProduced">2015-09-01</date>
              <date type="whenEndEmbargoed">2015-07-03</date>
              <ref type="file" target="https://hal-lirmm.ccsd.cnrs.fr/lirmm-01169603v1/document">
                <date notBefore="2015-07-03"/>
              </ref>
              <ref type="file" subtype="author" n="1" target="https://hal-lirmm.ccsd.cnrs.fr/lirmm-01169603v1/file/dexa_salah.pdf" id="file-1169603-1257556">
                <date notBefore="2015-07-03"/>
              </ref>
              <ref type="externalLink" target="https://hal-lirmm.ccsd.cnrs.fr/lirmm-01169603/file/dexa_salah.pdf"/>
            </edition>
            <respStmt>
              <resp>contributor</resp>
              <name key="137142">
                <persName>
                  <forename>Florent</forename>
                  <surname>Masseglia</surname>
                </persName>
                <email type="md5">2ebfe57879432a8eb507eec9cbc06284</email>
                <email type="domain">sophia.inria.fr</email>
              </name>
            </respStmt>
          </editionStmt>
          <publicationStmt>
            <distributor>CCSD</distributor>
            <idno type="halId">lirmm-01169603</idno>
            <idno type="halUri">https://hal-lirmm.ccsd.cnrs.fr/lirmm-01169603</idno>
            <idno type="halBibtex">salah:lirmm-01169603</idno>
            <idno type="halRefHtml">&lt;i&gt;DEXA 2015 - 26th International Conference on Database and Expert Systems Applications&lt;/i&gt;, Sep 2015, Valencia, Spain. pp.303-318, &lt;a target="_blank" href="https://dx.doi.org/10.1007/978-3-319-22849-5_21"&gt;&amp;#x27E8;10.1007/978-3-319-22849-5_21&amp;#x27E9;&lt;/a&gt;</idno>
            <idno type="halRef">DEXA 2015 - 26th International Conference on Database and Expert Systems Applications, Sep 2015, Valencia, Spain. pp.303-318, &amp;#x27E8;10.1007/978-3-319-22849-5_21&amp;#x27E9;</idno>
            <availability status="restricted">
              <licence target="https://about.hal.science/hal-authorisation-v1/">HAL Authorization<ref corresp="#file-1169603-1257556"/></licence>
            </availability>
          </publicationStmt>
          <seriesStmt>
            <idno type="stamp" n="CNRS">CNRS - Centre national de la recherche scientifique</idno>
            <idno type="stamp" n="INRIA">INRIA - Institut National de Recherche en Informatique et en Automatique</idno>
            <idno type="stamp" n="INRIA-SOPHIA">INRIA Sophia Antipolis - Méditerranée</idno>
            <idno type="stamp" n="INRIASO">INRIA-SOPHIA</idno>
            <idno type="stamp" n="INRIA_TEST">INRIA - Institut National de Recherche en Informatique et en Automatique</idno>
            <idno type="stamp" n="INRIA34">Antenne Inria de l'université de Montpellier</idno>
            <idno type="stamp" n="GRID5000">Grid'5000</idno>
            <idno type="stamp" n="TESTALAIN1">TESTALAIN1</idno>
            <idno type="stamp" n="ZENITH" corresp="LIRMM">Scientific Data Management</idno>
            <idno type="stamp" n="LIRMM">Laboratoire d'Informatique de Robotique et de Microélectronique de Montpellier</idno>
            <idno type="stamp" n="INRIA2">INRIA 2</idno>
            <idno type="stamp" n="MIPS">Mathématiques, Informatique, Physique et Systèmes</idno>
            <idno type="stamp" n="UNIV-MONTPELLIER">Université de Montpellier</idno>
            <idno type="stamp" n="UNIV-COTEDAZUR">Université Côte d'Azur</idno>
            <idno type="stamp" n="INRIA-300009">Inria 300009</idno>
            <idno type="stamp" n="UM-2015-2021" corresp="UNIV-MONTPELLIER">Université de Montpellier (2015-2021)</idno>
            <idno type="stamp" n="SLICES-FR">Publications from users of the SILECS research infrastructure</idno>
          </seriesStmt>
          <notesStmt>
            <note type="audience" n="2">International</note>
            <note type="invited" n="0">No</note>
            <note type="popular" n="0">No</note>
            <note type="peer" n="1">Yes</note>
            <note type="proceedings" n="1">Yes</note>
          </notesStmt>
          <sourceDesc>
            <biblStruct>
              <analytic>
                <title xml:lang="en">Data Partitioning for Fast Mining of Frequent Itemsets in Massively Distributed Environments</title>
                <author role="aut">
                  <persName>
                    <forename type="first">Saber</forename>
                    <surname>Salah</surname>
                  </persName>
                  <email type="md5">39374a361f2222408fe6dcb39e325a43</email>
                  <email type="domain">inria.fr</email>
                  <idno type="idhal" notation="numeric">967928</idno>
                  <idno type="halauthorid" notation="string">922189-967928</idno>
                  <affiliation ref="#struct-141072"/>
                </author>
                <author role="aut">
                  <persName>
                    <forename type="first">Reza</forename>
                    <surname>Akbarinia</surname>
                  </persName>
                  <email type="md5">521e1deee4724b1d0699efe11300ed33</email>
                  <email type="domain">inria.fr</email>
                  <idno type="idhal" notation="string">reza-akbarinia</idno>
                  <idno type="idhal" notation="numeric">172647</idno>
                  <idno type="halauthorid" notation="string">8354-172647</idno>
                  <idno type="ORCID">https://orcid.org/0000-0002-7098-0361</idno>
                  <idno type="IDREF">https://www.idref.fr/119863421</idno>
                  <orgName ref="#struct-300009"/>
                  <affiliation ref="#struct-141072"/>
                </author>
                <author role="aut">
                  <persName>
                    <forename type="first">Florent</forename>
                    <surname>Masseglia</surname>
                  </persName>
                  <email type="md5">57004dd61ce7344cbd00f2bd70fc6ec2</email>
                  <email type="domain">inria.fr</email>
                  <idno type="idhal" notation="string">florent-masseglia</idno>
                  <idno type="idhal" notation="numeric">172896</idno>
                  <idno type="halauthorid" notation="string">17272-172896</idno>
                  <idno type="ORCID">https://orcid.org/0000-0002-1149-585X</idno>
                  <idno type="IDREF">https://www.idref.fr/120528681</idno>
                  <orgName ref="#struct-300009"/>
                  <affiliation ref="#struct-141072"/>
                </author>
              </analytic>
              <monogr>
                <meeting>
                  <title>DEXA 2015 - 26th International Conference on Database and Expert Systems Applications</title>
                  <date type="start">2015-09-01</date>
                  <date type="end">2015-09-04</date>
                  <settlement>Valencia</settlement>
                  <country key="ES">Spain</country>
                </meeting>
                <imprint>
                  <biblScope unit="volume">LNCS</biblScope>
                  <biblScope unit="issue">9261</biblScope>
                  <biblScope unit="pp">303-318</biblScope>
                  <date type="datePub">2015</date>
                </imprint>
              </monogr>
              <idno type="doi">10.1007/978-3-319-22849-5_21</idno>
              <ref type="publisher">http://www.dexa.org</ref>
            </biblStruct>
          </sourceDesc>
          <profileDesc>
            <langUsage>
              <language ident="en">English</language>
            </langUsage>
            <textClass>
              <keywords scheme="author">
                <term xml:lang="en">Data Mining</term>
                <term xml:lang="en">Machine Learning</term>
                <term xml:lang="en">Frequent Itemset</term>
                <term xml:lang="en">MapReduce</term>
                <term xml:lang="en">Big Data</term>
              </keywords>
              <classCode scheme="halDomain" n="info.info-db">Computer Science [cs]/Databases [cs.DB]</classCode>
              <classCode scheme="halTypology" n="COMM">Conference papers</classCode>
              <classCode scheme="halOldTypology" n="COMM">Conference papers</classCode>
              <classCode scheme="halTreeTypology" n="COMM">Conference papers</classCode>
            </textClass>
            <abstract xml:lang="en">
              <p>Frequent itemset mining (FIM) is one of the fundamental cornerstones in data mining. While the problem of FIM has been thoroughly studied, few of both standard and improved solutions scale. This is mainly the case when i) the amount of data tends to be very large and/or ii) the minimum support (MinSup) threshold is very low. In this paper, we propose a highly scalable, parallel frequent itemset mining (PFIM) algorithm, namely Parallel Absolute Top Down (PATD). PATD algorithm renders the mining process of very large databases (up to Terabytes of data) simple and compact. Its mining process is made up of only one parallel job, which dramatically reduces the mining runtime, the communication cost and the energy power consumption overhead, in a distributed computational platform. Based on a clever and efficient data partitioning strategy, namely Item Based Data Partitioning (IBDP), PATD algorithm mines each data partition independently, relying on an absolute minimum support (AMinSup) instead of a relative one. PATD has been extensively evaluated using real-world data sets. Our experimental results suggest that PATD algorithm is significantly more efficient and scalable than alternative approaches.</p>
            </abstract>
          </profileDesc>
        </biblFull>
      </listBibl>
    </body>
    <back>
      <listOrg type="structures">
        <org type="researchteam" xml:id="struct-141072" status="OLD">
          <idno type="RNSR">201121208J</idno>
          <orgName>Scientific Data Management</orgName>
          <orgName type="acronym">ZENITH</orgName>
          <date type="end">2021-12-31</date>
          <desc>
            <address>
              <addrLine>LIRMM, 161 rue Ada, 34000 Montpellier</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">https://team.inria.fr/zenith/</ref>
          </desc>
          <listRelation>
            <relation active="#struct-181" type="direct"/>
            <relation name="UMR5506" active="#struct-410122" type="indirect"/>
            <relation name="UMR5506" active="#struct-441569" type="indirect"/>
            <relation active="#struct-34586" type="direct"/>
            <relation active="#struct-300009" type="indirect"/>
          </listRelation>
        </org>
        <org type="laboratory" xml:id="struct-181" status="OLD">
          <idno type="IdRef">139590827</idno>
          <idno type="ISNI">0000000405990488</idno>
          <idno type="RNSR">199111950H</idno>
          <idno type="ROR">https://ror.org/013yean28</idno>
          <orgName>Laboratoire d'Informatique de Robotique et de Microélectronique de Montpellier</orgName>
          <orgName type="acronym">LIRMM</orgName>
          <date type="start">1995-01-01</date>
          <date type="end">2021-12-31</date>
          <desc>
            <address>
              <addrLine>161 rue Ada - 34095 Montpellier</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">https://www.lirmm.fr</ref>
          </desc>
          <listRelation>
            <relation name="UMR5506" active="#struct-410122" type="direct"/>
            <relation name="UMR5506" active="#struct-441569" type="direct"/>
          </listRelation>
        </org>
        <org type="institution" xml:id="struct-410122" status="OLD">
          <idno type="ISNI">0000000120970141</idno>
          <idno type="ROR">https://ror.org/051escj72</idno>
          <orgName>Université de Montpellier</orgName>
          <orgName type="acronym">UM</orgName>
          <date type="end">2021-12-31</date>
          <desc>
            <address>
              <addrLine>163 rue Auguste Broussonnet - 34090 Montpellier</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">http://www.umontpellier.fr/</ref>
          </desc>
        </org>
        <org type="regroupinstitution" xml:id="struct-441569" status="VALID">
          <idno type="IdRef">02636817X</idno>
          <idno type="ISNI">0000000122597504</idno>
          <idno type="ROR">https://ror.org/02feahw73</idno>
          <orgName>Centre National de la Recherche Scientifique</orgName>
          <orgName type="acronym">CNRS</orgName>
          <date type="start">1939-10-19</date>
          <desc>
            <address>
              <country key="FR"/>
            </address>
            <ref type="url">https://www.cnrs.fr/</ref>
          </desc>
        </org>
        <org type="laboratory" xml:id="struct-34586" status="VALID">
          <idno type="RNSR">198318250R</idno>
          <idno type="ROR">https://ror.org/01nzkaw91</idno>
          <orgName>Centre Inria d'Université Côte d'Azur</orgName>
          <desc>
            <address>
              <addrLine>2004 route des Lucioles BP 93 06902 Sophia Antipolis</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">http://www.inria.fr/centre/sophia/</ref>
          </desc>
          <listRelation>
            <relation active="#struct-300009" type="direct"/>
          </listRelation>
        </org>
        <org type="institution" xml:id="struct-300009" status="VALID">
          <idno type="ROR">https://ror.org/02kvxyf05</idno>
          <orgName>Institut National de Recherche en Informatique et en Automatique</orgName>
          <orgName type="acronym">Inria</orgName>
          <desc>
            <address>
              <addrLine>Domaine de Voluceau Rocquencourt - BP 105 78153 Le Chesnay Cedex</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">http://www.inria.fr/en/</ref>
          </desc>
        </org>
      </listOrg>
    </back>
  </text>
</TEI>