<?xml version="1.0" encoding="utf-8"?>
<TEI xmlns="http://www.tei-c.org/ns/1.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:hal="http://hal.archives-ouvertes.fr/" xmlns:gml="http://www.opengis.net/gml/3.3/" xmlns:gmlce="http://www.opengis.net/gml/3.3/ce" version="1.1" xsi:schemaLocation="http://www.tei-c.org/ns/1.0 http://api.archives-ouvertes.fr/documents/aofr-sword.xsd">
  <teiHeader>
    <fileDesc>
      <titleStmt>
        <title>HAL TEI export of hal-04295228</title>
      </titleStmt>
      <publicationStmt>
        <distributor>CCSD</distributor>
        <availability status="restricted">
          <licence target="https://creativecommons.org/publicdomain/zero/1.0/">CC0 1.0 - Universal</licence>
        </availability>
        <date when="2026-05-24T19:40:45+02:00"/>
      </publicationStmt>
      <sourceDesc>
        <p part="N">HAL API Platform</p>
      </sourceDesc>
    </fileDesc>
  </teiHeader>
  <text>
    <body>
      <listBibl>
        <biblFull>
          <titleStmt>
            <title xml:lang="en">Geo-Semantic Event-POI Matching of Large Mobility Datasets</title>
            <author role="aut">
              <persName>
                <forename type="first">Ndiouma</forename>
                <surname>Bame</surname>
              </persName>
              <idno type="halauthorid">937241-0</idno>
              <affiliation ref="#struct-1175215"/>
            </author>
            <author role="aut">
              <persName>
                <forename type="first">Ibrahima</forename>
                <surname>Gueye</surname>
              </persName>
              <idno type="halauthorid">246756-0</idno>
              <affiliation ref="#struct-217991"/>
            </author>
            <author role="aut">
              <persName>
                <forename type="first">Hubert</forename>
                <surname>Naacke</surname>
              </persName>
              <email type="md5">fb2112a843a757bff27e0398b762ba0b</email>
              <email type="domain">lip6.fr</email>
              <idno type="idhal" notation="string">hubert-naacke</idno>
              <idno type="idhal" notation="numeric">9627</idno>
              <idno type="halauthorid" notation="string">9851-9627</idno>
              <idno type="ORCID">https://orcid.org/0000-0003-0559-9908</idno>
              <idno type="IDREF">https://www.idref.fr/06104203X</idno>
              <affiliation ref="#struct-541715"/>
            </author>
            <editor role="depositor">
              <persName>
                <forename>Hubert</forename>
                <surname>Naacke</surname>
              </persName>
              <email type="md5">fb2112a843a757bff27e0398b762ba0b</email>
              <email type="domain">lip6.fr</email>
            </editor>
          </titleStmt>
          <editionStmt>
            <edition n="v1" type="current">
              <date type="whenSubmitted">2023-11-20 12:07:21</date>
              <date type="whenModified">2024-10-30 13:32:32</date>
              <date type="whenReleased">2023-11-20 12:07:21</date>
              <date type="whenProduced">2023-07-11</date>
              <ref type="externalLink" target="https://doi.org/10.5220/0012132700003541"/>
            </edition>
            <respStmt>
              <resp>contributor</resp>
              <name key="450218">
                <persName>
                  <forename>Hubert</forename>
                  <surname>Naacke</surname>
                </persName>
                <email type="md5">fb2112a843a757bff27e0398b762ba0b</email>
                <email type="domain">lip6.fr</email>
              </name>
            </respStmt>
          </editionStmt>
          <publicationStmt>
            <distributor>CCSD</distributor>
            <idno type="halId">hal-04295228</idno>
            <idno type="halUri">https://hal.sorbonne-universite.fr/hal-04295228</idno>
            <idno type="halBibtex">bame:hal-04295228</idno>
            <idno type="halRefHtml">&lt;i&gt;12th International Conference on Data Science, Technology and Applications&lt;/i&gt;, Jul 2023, Rome, Italy. pp.496-503, &lt;a target="_blank" href="https://dx.doi.org/10.5220/0012132700003541"&gt;&amp;#x27E8;10.5220/0012132700003541&amp;#x27E9;&lt;/a&gt;</idno>
            <idno type="halRef">12th International Conference on Data Science, Technology and Applications, Jul 2023, Rome, Italy. pp.496-503, ⟨10.5220/0012132700003541⟩</idno>
            <availability status="restricted"/>
          </publicationStmt>
          <seriesStmt>
            <idno type="stamp" n="CNRS">CNRS - Centre national de la recherche scientifique</idno>
            <idno type="stamp" n="LIP6" corresp="SORBONNE-UNIVERSITE">Laboratoire d'Informatique de Paris 6</idno>
            <idno type="stamp" n="SORBONNE-UNIVERSITE">Sorbonne Université</idno>
            <idno type="stamp" n="SORBONNE-UNIV" corresp="SORBONNE-UNIVERSITE">Sorbonne Université 01/01/2018</idno>
            <idno type="stamp" n="SU-SCIENCES" corresp="SORBONNE-UNIVERSITE">Faculté des Sciences de Sorbonne Université</idno>
            <idno type="stamp" n="SU-TI">Sorbonne Université - Texte Intégral</idno>
            <idno type="stamp" n="ALLIANCE-SU">Alliance Sorbonne Université</idno>
            <idno type="stamp" n="SUPRA_MATHS_INFO">Mathématiques + Informatique</idno>
          </seriesStmt>
          <notesStmt>
            <note type="audience" n="2">International</note>
            <note type="invited" n="0">No</note>
            <note type="popular" n="0">No</note>
            <note type="peer" n="1">Yes</note>
            <note type="proceedings" n="1">Yes</note>
          </notesStmt>
          <sourceDesc>
            <biblStruct>
              <analytic>
                <title xml:lang="en">Geo-Semantic Event-POI Matching of Large Mobility Datasets</title>
                <author role="aut">
                  <persName>
                    <forename type="first">Ndiouma</forename>
                    <surname>Bame</surname>
                  </persName>
                  <idno type="halauthorid">937241-0</idno>
                  <affiliation ref="#struct-1175215"/>
                </author>
                <author role="aut">
                  <persName>
                    <forename type="first">Ibrahima</forename>
                    <surname>Gueye</surname>
                  </persName>
                  <idno type="halauthorid">246756-0</idno>
                  <affiliation ref="#struct-217991"/>
                </author>
                <author role="aut">
                  <persName>
                    <forename type="first">Hubert</forename>
                    <surname>Naacke</surname>
                  </persName>
                  <email type="md5">fb2112a843a757bff27e0398b762ba0b</email>
                  <email type="domain">lip6.fr</email>
                  <idno type="idhal" notation="string">hubert-naacke</idno>
                  <idno type="idhal" notation="numeric">9627</idno>
                  <idno type="halauthorid" notation="string">9851-9627</idno>
                  <idno type="ORCID">https://orcid.org/0000-0003-0559-9908</idno>
                  <idno type="IDREF">https://www.idref.fr/06104203X</idno>
                  <affiliation ref="#struct-541715"/>
                </author>
              </analytic>
              <monogr>
                <idno type="isbn">978-989-758-664-4</idno>
                <title level="m">Proceedings of the 12th International Conference on Data Science, Technology and Applications DATA</title>
                <meeting>
                  <title>12th International Conference on Data Science, Technology and Applications</title>
                  <date type="start">2023-07-11</date>
                  <date type="end">2023-07-13</date>
                  <settlement>Rome</settlement>
                  <country key="IT">Italy</country>
                </meeting>
                <imprint>
                  <publisher>SciTePress - Science and Technology Publications</publisher>
                  <biblScope unit="volume">1</biblScope>
                  <biblScope unit="pp">496-503</biblScope>
                  <date type="datePub">2023</date>
                </imprint>
              </monogr>
              <idno type="doi">10.5220/0012132700003541</idno>
            </biblStruct>
          </sourceDesc>
          <profileDesc>
            <langUsage>
              <language ident="en">English</language>
            </langUsage>
            <textClass>
              <keywords scheme="author">
                <term xml:lang="en">Open data</term>
                <term xml:lang="en">sentence embedding</term>
                <term xml:lang="en">event-POI matching</term>
                <term xml:lang="en">semantic similarity</term>
                <term xml:lang="en">Geographic similarity</term>
              </keywords>
              <classCode scheme="https://dl.acm.org/ccs" n="ACM2012.H.2.2.0"/>
              <classCode scheme="https://dl.acm.org/ccs" n="ACM2012.H.2.7.0"/>
              <classCode scheme="https://dl.acm.org/ccs" n="ACM2012.H.2.7.4"/>
              <classCode scheme="halDomain" n="info.info-db">Computer Science [cs]/Databases [cs.DB]</classCode>
              <classCode scheme="halTypology" n="COMM">Conference papers</classCode>
              <classCode scheme="halOldTypology" n="COMM">Conference papers</classCode>
              <classCode scheme="halTreeTypology" n="COMM">Conference papers</classCode>
            </textClass>
            <abstract xml:lang="en">
              <p>Users often share data about their daily activities through social networks. These event data are very useful for a variety of use cases such as points of interest (POI) recommendation. However, event data often lack information about POIs. Thus, enriching event data with POI information is of utmost importance. This requires knowing the POI in which an event took place before completing the data. We face the problem of aligning two types of data sources, event data and POI data, which is difficult because they do not have a common identifier or the same descriptive attributes. This work proposes and implements a complete methodology for the enrichment of a large dataset of geolocated data on user events with POI using both geographical and semantic properties. This effective methodology for matching POIs with geo-located events comprises four steps: (i) in a first step, we cross-reference the data using spatial proximity to define the geographical neighborhood of each event; (ii) in a second step, we define the semantic neighborhood of each event based on a threshold on the semantic similarity. The semantic similarity exploits event data such as their contextual description and the tags by crossing them with those of the POI. (iii) these two types of similarity are combined for each POI of the event semantic neighborhood, to evaluate a geo-semantic similarity score; (iv) subsequently, each event is matched with the POI of the semantic neighborhood which maximizes the geo-semantic similarity score. We propose a robust modeling of our methodology and evaluate the effectiveness of our approach.</p>
            </abstract>
          </profileDesc>
        </biblFull>
      </listBibl>
    </body>
    <back>
      <listOrg type="structures">
        <org type="institution" xml:id="struct-1175215" status="VALID">
          <idno type="ROR">https://ror.org/04je6yw13</idno>
          <orgName>Université Cheikh Anta Diop de Dakar [Sénégal]</orgName>
          <orgName type="acronym">UCAD</orgName>
          <date type="start">1987-01-01</date>
          <desc>
            <address>
              <addrLine>Université Cheikh Anta Diop de Dakar - Rectorat, BP 5005 Dakar-fann</addrLine>
              <country key="SN"/>
            </address>
            <ref type="url">https://www.ucad.sn/</ref>
          </desc>
        </org>
        <org type="institution" xml:id="struct-217991" status="VALID">
          <orgName>Ecole polytechnique de Thiès</orgName>
          <date type="start">1973-01-01</date>
          <desc>
            <address>
              <addrLine>Entrée de Thiès - BP A10 - Thiès</addrLine>
              <country key="SN"/>
            </address>
            <ref type="url">https://ept.sn/</ref>
          </desc>
        </org>
        <org type="researchteam" xml:id="struct-541715" status="VALID">
          <orgName>Bases de Données</orgName>
          <orgName type="acronym">BD</orgName>
          <date type="start">2008-01-01</date>
          <desc>
            <address>
              <country key="FR"/>
            </address>
          </desc>
          <listRelation>
            <relation active="#struct-541703" type="direct"/>
            <relation active="#struct-413221" type="indirect"/>
            <relation name="UMR7606" active="#struct-441569" type="indirect"/>
          </listRelation>
        </org>
        <org type="laboratory" xml:id="struct-541703" status="VALID">
          <idno type="IdRef">13558292X</idno>
          <idno type="RNSR">199712651U</idno>
          <idno type="ROR">https://ror.org/05krcen59</idno>
          <orgName>LIP6</orgName>
          <date type="start">2018-01-01</date>
          <desc>
            <address>
              <addrLine>4 Place JUSSIEU 75252 PARIS CEDEX 05</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">http://www.lip6.fr/</ref>
          </desc>
          <listRelation>
            <relation active="#struct-413221" type="direct"/>
            <relation name="UMR7606" active="#struct-441569" type="direct"/>
          </listRelation>
        </org>
        <org type="regroupinstitution" xml:id="struct-413221" status="VALID">
          <idno type="IdRef">221333754</idno>
          <idno type="ROR">https://ror.org/02en5vm52</idno>
          <orgName>Sorbonne Université</orgName>
          <orgName type="acronym">SU</orgName>
          <date type="start">2018-01-01</date>
          <desc>
            <address>
              <addrLine>21 rue de l’École de médecine - 75006 Paris</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">http://www.sorbonne-universite.fr/</ref>
          </desc>
        </org>
        <org type="regroupinstitution" xml:id="struct-441569" status="VALID">
          <idno type="IdRef">02636817X</idno>
          <idno type="ISNI">0000000122597504</idno>
          <idno type="ROR">https://ror.org/02feahw73</idno>
          <orgName>Centre National de la Recherche Scientifique</orgName>
          <orgName type="acronym">CNRS</orgName>
          <date type="start">1939-10-19</date>
          <desc>
            <address>
              <country key="FR"/>
            </address>
            <ref type="url">https://www.cnrs.fr/</ref>
          </desc>
        </org>
      </listOrg>
    </back>
  </text>
</TEI>