<?xml version="1.0" encoding="utf-8"?>
<TEI xmlns="http://www.tei-c.org/ns/1.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:hal="http://hal.archives-ouvertes.fr/" xmlns:gml="http://www.opengis.net/gml/3.3/" xmlns:gmlce="http://www.opengis.net/gml/3.3/ce" version="1.1" xsi:schemaLocation="http://www.tei-c.org/ns/1.0 http://api.archives-ouvertes.fr/documents/aofr-sword.xsd">
  <teiHeader>
    <fileDesc>
      <titleStmt>
        <title>HAL TEI export of hal-02505162</title>
      </titleStmt>
      <publicationStmt>
        <distributor>CCSD</distributor>
        <availability status="restricted">
          <licence target="https://creativecommons.org/publicdomain/zero/1.0/">CC0 1.0 - Universal</licence>
        </availability>
        <date when="2026-05-18T16:53:27+02:00"/>
      </publicationStmt>
      <sourceDesc>
        <p part="N">HAL API Platform</p>
      </sourceDesc>
    </fileDesc>
  </teiHeader>
  <text>
    <body>
      <listBibl>
        <biblFull>
          <titleStmt>
            <title xml:lang="en">Contextual Bandits with Hidden Contexts: a Focused Data Capture From Social Media Streams</title>
            <author role="aut">
              <persName>
                <forename type="first">Sylvain</forename>
                <surname>Lamprier</surname>
              </persName>
              <email type="md5">942471cad263f780de2404e093709852</email>
              <email type="domain">yahoo.fr</email>
              <idno type="idhal" notation="string">sylvain-lamprier</idno>
              <idno type="idhal" notation="numeric">740402</idno>
              <idno type="halauthorid" notation="string">30958-740402</idno>
              <idno type="ORCID">https://orcid.org/0000-0002-2508-922X</idno>
              <idno type="IDREF">https://www.idref.fr/142632201</idno>
              <idno type="ISNI">http://isni.org/isni/0000000140859141</idno>
              <idno type="VIAF">https://viaf.org/viaf/200144138</idno>
              <idno type="RESEARCHERID">http://www.researcherid.com/rid/DYO-1764-2022</idno>
              <affiliation ref="#struct-541720"/>
            </author>
            <author role="aut">
              <persName>
                <forename type="first">Thibault</forename>
                <surname>Gisselbrecht</surname>
              </persName>
              <email type="md5">4c1f1af668abea9586f87f717bb17653</email>
              <email type="domain">SNIPS.AI</email>
              <idno type="idhal" notation="numeric">1044395</idno>
              <idno type="halauthorid" notation="string">1052454-1044395</idno>
              <affiliation ref="#struct-543507"/>
            </author>
            <author role="aut">
              <persName>
                <forename type="first">Patrick</forename>
                <surname>Gallinari</surname>
              </persName>
              <email type="md5">d928d788b4143b63dbc87c6175a152be</email>
              <email type="domain">sorbonne-universite.fr</email>
              <idno type="idhal" notation="string">patrick-gallinari</idno>
              <idno type="idhal" notation="numeric">751615</idno>
              <idno type="halauthorid" notation="string">1778-751615</idno>
              <idno type="ORCID">https://orcid.org/0000-0001-9060-9001</idno>
              <idno type="IDREF">https://www.idref.fr/070709076</idno>
              <idno type="RESEARCHERID">http://www.researcherid.com/rid/CSF-2807-2022</idno>
              <idno type="VIAF">https://viaf.org/viaf/6686337</idno>
              <idno type="RESEARCHERID">http://www.researcherid.com/rid/CSF-2807-2022</idno>
              <orgName ref="#struct-93591"/>
              <affiliation ref="#struct-541720"/>
            </author>
            <editor role="depositor">
              <persName>
                <forename>Sylvain</forename>
                <surname>Lamprier</surname>
              </persName>
              <email type="md5">942471cad263f780de2404e093709852</email>
              <email type="domain">yahoo.fr</email>
            </editor>
          </titleStmt>
          <editionStmt>
            <edition n="v1" type="current">
              <date type="whenSubmitted">2020-03-11 11:54:29</date>
              <date type="whenModified">2024-10-30 13:33:34</date>
              <date type="whenReleased">2020-03-11 11:54:29</date>
              <date type="whenProduced">2019-11</date>
            </edition>
            <respStmt>
              <resp>contributor</resp>
              <name key="143739">
                <persName>
                  <forename>Sylvain</forename>
                  <surname>Lamprier</surname>
                </persName>
                <email type="md5">942471cad263f780de2404e093709852</email>
                <email type="domain">yahoo.fr</email>
              </name>
            </respStmt>
          </editionStmt>
          <publicationStmt>
            <distributor>CCSD</distributor>
            <idno type="halId">hal-02505162</idno>
            <idno type="halUri">https://hal.sorbonne-universite.fr/hal-02505162</idno>
            <idno type="halBibtex">lamprier:hal-02505162</idno>
            <idno type="halRefHtml">&lt;i&gt;Data Mining and Knowledge Discovery&lt;/i&gt;, 2019, 33, pp.1853-1893. &lt;a target="_blank" href="https://dx.doi.org/10.1007/s10618-019-00648-w"&gt;&amp;#x27E8;10.1007/s10618-019-00648-w&amp;#x27E9;&lt;/a&gt;</idno>
            <idno type="halRef">Data Mining and Knowledge Discovery, 2019, 33, pp.1853-1893. ⟨10.1007/s10618-019-00648-w⟩</idno>
            <availability status="restricted"/>
          </publicationStmt>
          <seriesStmt>
            <idno type="stamp" n="CNRS">CNRS - Centre national de la recherche scientifique</idno>
            <idno type="stamp" n="LIP6" corresp="SORBONNE-UNIVERSITE">Laboratoire d'Informatique de Paris 6</idno>
            <idno type="stamp" n="SORBONNE-UNIVERSITE">Sorbonne Université</idno>
            <idno type="stamp" n="SORBONNE-UNIV" corresp="SORBONNE-UNIVERSITE">Sorbonne Université 01/01/2018</idno>
            <idno type="stamp" n="SU-SCIENCES" corresp="SORBONNE-UNIVERSITE">Faculté des Sciences de Sorbonne Université</idno>
            <idno type="stamp" n="TEST-HALCNRS">Collection test HAL CNRS</idno>
            <idno type="stamp" n="ALLIANCE-SU">Alliance Sorbonne Université</idno>
            <idno type="stamp" n="SUPRA_MATHS_INFO">Mathématiques + Informatique</idno>
          </seriesStmt>
          <notesStmt>
            <note type="audience" n="2">International</note>
            <note type="popular" n="0">No</note>
            <note type="peer" n="1">Yes</note>
          </notesStmt>
          <sourceDesc>
            <biblStruct>
              <analytic>
                <title xml:lang="en">Contextual Bandits with Hidden Contexts: a Focused Data Capture From Social Media Streams</title>
                <author role="aut">
                  <persName>
                    <forename type="first">Sylvain</forename>
                    <surname>Lamprier</surname>
                  </persName>
                  <email type="md5">942471cad263f780de2404e093709852</email>
                  <email type="domain">yahoo.fr</email>
                  <idno type="idhal" notation="string">sylvain-lamprier</idno>
                  <idno type="idhal" notation="numeric">740402</idno>
                  <idno type="halauthorid" notation="string">30958-740402</idno>
                  <idno type="ORCID">https://orcid.org/0000-0002-2508-922X</idno>
                  <idno type="IDREF">https://www.idref.fr/142632201</idno>
                  <idno type="ISNI">http://isni.org/isni/0000000140859141</idno>
                  <idno type="VIAF">https://viaf.org/viaf/200144138</idno>
                  <idno type="RESEARCHERID">http://www.researcherid.com/rid/DYO-1764-2022</idno>
                  <affiliation ref="#struct-541720"/>
                </author>
                <author role="aut">
                  <persName>
                    <forename type="first">Thibault</forename>
                    <surname>Gisselbrecht</surname>
                  </persName>
                  <email type="md5">4c1f1af668abea9586f87f717bb17653</email>
                  <email type="domain">SNIPS.AI</email>
                  <idno type="idhal" notation="numeric">1044395</idno>
                  <idno type="halauthorid" notation="string">1052454-1044395</idno>
                  <affiliation ref="#struct-543507"/>
                </author>
                <author role="aut">
                  <persName>
                    <forename type="first">Patrick</forename>
                    <surname>Gallinari</surname>
                  </persName>
                  <email type="md5">d928d788b4143b63dbc87c6175a152be</email>
                  <email type="domain">sorbonne-universite.fr</email>
                  <idno type="idhal" notation="string">patrick-gallinari</idno>
                  <idno type="idhal" notation="numeric">751615</idno>
                  <idno type="halauthorid" notation="string">1778-751615</idno>
                  <idno type="ORCID">https://orcid.org/0000-0001-9060-9001</idno>
                  <idno type="IDREF">https://www.idref.fr/070709076</idno>
                  <idno type="RESEARCHERID">http://www.researcherid.com/rid/CSF-2807-2022</idno>
                  <idno type="VIAF">https://viaf.org/viaf/6686337</idno>
                  <idno type="RESEARCHERID">http://www.researcherid.com/rid/CSF-2807-2022</idno>
                  <orgName ref="#struct-93591"/>
                  <affiliation ref="#struct-541720"/>
                </author>
              </analytic>
              <monogr>
                <idno type="halJournalId" status="VALID">12470</idno>
                <idno type="issn">1384-5810</idno>
                <idno type="eissn">1573-756X</idno>
                <title level="j">Data Mining and Knowledge Discovery</title>
                <imprint>
                  <publisher>Springer</publisher>
                  <biblScope unit="serie">33</biblScope>
                  <biblScope unit="pp">1853-1893</biblScope>
                  <date type="datePub">2019-11</date>
                  <date type="dateEpub">2019-08</date>
                </imprint>
              </monogr>
              <idno type="doi">10.1007/s10618-019-00648-w</idno>
            </biblStruct>
          </sourceDesc>
          <profileDesc>
            <langUsage>
              <language ident="en">English</language>
            </langUsage>
            <textClass>
              <classCode scheme="halDomain" n="info.info-ai">Computer Science [cs]/Artificial Intelligence [cs.AI]</classCode>
              <classCode scheme="halTypology" n="ART">Journal articles</classCode>
              <classCode scheme="halOldTypology" n="ART">Journal articles</classCode>
              <classCode scheme="halTreeTypology" n="ART">Journal articles</classCode>
            </textClass>
            <abstract xml:lang="en">
              <p>This paper addresses the problem of real time data capture from social media. Due to different limitations, it is not possible to collect all the data produced by social networks such as Twitter. Therefore, to be able to gather enough relevant information related to a predefined need, it is necessary to focus on a subset of the information sources. In this work, we focus on user-centered data capture and consider each account of a social network as a source that can be followed at each iteration of a data capture process. This process, whose aim is to maximize the cumulative utility of the captured information for the specified need, is constrained at each time step by the number of users that can be monitored simultaneously. The problem of selecting a subset of accounts to listen to over time is a sequential decision problem under constraints, which we formalize as a bandit problem with multiple selections. In this work, we propose a contextual UCB-like approach, that uses the activity of any user during the current step to predict his future behavior. Besides the capture of usefulness variations, considering contexts also enables to improve the efficiency of the process by leveraging some structure in the search space. However, existing contextual bandit approaches do not fit for our setting where most of the contexts are hidden from the agent. We therefore propose a new algorithm, called HiddenLinUCB, which aims at dealing with such missing information via variational inference. Experiments demonstrate the very good behavior of this approach compared to existing methods for tasks of data capture from social networks.</p>
            </abstract>
          </profileDesc>
        </biblFull>
      </listBibl>
    </body>
    <back>
      <listOrg type="structures">
        <org type="researchteam" xml:id="struct-541720" status="OLD">
          <orgName>Machine Learning and Information Access</orgName>
          <orgName type="acronym">MLIA</orgName>
          <date type="start">2018-01-01</date>
          <date type="end">2021-12-31</date>
          <desc>
            <address>
              <country key="FR"/>
            </address>
          </desc>
          <listRelation>
            <relation active="#struct-541703" type="direct"/>
            <relation active="#struct-413221" type="indirect"/>
            <relation name="UMR7606" active="#struct-441569" type="indirect"/>
          </listRelation>
        </org>
        <org type="institution" xml:id="struct-543507" status="INCOMING">
          <orgName>SNIPS</orgName>
          <desc>
            <address>
              <addrLine>Paris</addrLine>
              <country key="FR"/>
            </address>
          </desc>
        </org>
        <org type="laboratory" xml:id="struct-541703" status="VALID">
          <idno type="IdRef">13558292X</idno>
          <idno type="RNSR">199712651U</idno>
          <idno type="ROR">https://ror.org/05krcen59</idno>
          <orgName>LIP6</orgName>
          <date type="start">2018-01-01</date>
          <desc>
            <address>
              <addrLine>4 Place JUSSIEU 75252 PARIS CEDEX 05</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">http://www.lip6.fr/</ref>
          </desc>
          <listRelation>
            <relation active="#struct-413221" type="direct"/>
            <relation name="UMR7606" active="#struct-441569" type="direct"/>
          </listRelation>
        </org>
        <org type="regroupinstitution" xml:id="struct-413221" status="VALID">
          <idno type="IdRef">221333754</idno>
          <idno type="ROR">https://ror.org/02en5vm52</idno>
          <orgName>Sorbonne Université</orgName>
          <orgName type="acronym">SU</orgName>
          <date type="start">2018-01-01</date>
          <desc>
            <address>
              <addrLine>21 rue de l’École de médecine - 75006 Paris</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">http://www.sorbonne-universite.fr/</ref>
          </desc>
        </org>
        <org type="regroupinstitution" xml:id="struct-441569" status="VALID">
          <idno type="IdRef">02636817X</idno>
          <idno type="ISNI">0000000122597504</idno>
          <idno type="ROR">https://ror.org/02feahw73</idno>
          <orgName>Centre National de la Recherche Scientifique</orgName>
          <orgName type="acronym">CNRS</orgName>
          <date type="start">1939-10-19</date>
          <desc>
            <address>
              <country key="FR"/>
            </address>
            <ref type="url">https://www.cnrs.fr/</ref>
          </desc>
        </org>
      </listOrg>
    </back>
  </text>
</TEI>