<?xml version="1.0" encoding="utf-8"?>
<TEI xmlns="http://www.tei-c.org/ns/1.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:hal="http://hal.archives-ouvertes.fr/" xmlns:gml="http://www.opengis.net/gml/3.3/" xmlns:gmlce="http://www.opengis.net/gml/3.3/ce" version="1.1" xsi:schemaLocation="http://www.tei-c.org/ns/1.0 http://api.archives-ouvertes.fr/documents/aofr-sword.xsd">
  <!-- Export-level header: its title names this file as the HAL TEI export of hal-02074907.
       The bibliographic record itself is carried in <text>, not here. -->
  <teiHeader>
    <fileDesc>
      <titleStmt>
        <title>HAL TEI export of hal-02074907</title>
      </titleStmt>
      <publicationStmt>
        <distributor>CCSD</distributor>
        <!-- NOTE(review): status="restricted" is paired with a CC0 (public domain dedication)
             licence target; confirm with the exporter which of the two is intended. -->
        <availability status="restricted">
          <licence target="https://creativecommons.org/publicdomain/zero/1.0/">CC0 1.0 - Universal</licence>
        </availability>
        <!-- Timestamp with an explicit +02:00 offset; presumably the moment the export was generated (TODO confirm). -->
        <date when="2026-05-17T21:51:06+02:00"/>
      </publicationStmt>
      <sourceDesc>
        <p part="N">HAL API Platform</p>
      </sourceDesc>
    </fileDesc>
  </teiHeader>
  <text>
    <body>
      <listBibl>
        <biblFull>
          <!-- Title, the three authors (role="aut") and the depositor of the record.
               Each author carries two <email> entries: type="md5" holds a 32-hex-digit digest
               (presumably of the address; TODO confirm) and type="domain" holds only the mail domain.
               <affiliation ref="#struct-N"/> points at an <org xml:id="struct-N"> in the <back> listOrg. -->
          <titleStmt>
            <title xml:lang="en">Profile-Based Bandit with Unknown Profiles</title>
            <author role="aut">
              <persName>
                <forename type="first">Sylvain</forename>
                <surname>Lamprier</surname>
              </persName>
              <email type="md5">942471cad263f780de2404e093709852</email>
              <email type="domain">yahoo.fr</email>
              <idno type="idhal" notation="string">sylvain-lamprier</idno>
              <idno type="idhal" notation="numeric">740402</idno>
              <idno type="halauthorid" notation="string">30958-740402</idno>
              <idno type="ORCID">https://orcid.org/0000-0002-2508-922X</idno>
              <idno type="IDREF">https://www.idref.fr/142632201</idno>
              <idno type="ISNI">http://isni.org/isni/0000000140859141</idno>
              <idno type="VIAF">https://viaf.org/viaf/200144138</idno>
              <idno type="RESEARCHERID">http://www.researcherid.com/rid/DYO-1764-2022</idno>
              <affiliation ref="#struct-541720"/>
            </author>
            <!-- This author has only the numeric idhal form; no string idhal is present. -->
            <author role="aut">
              <persName>
                <forename type="first">Thibault</forename>
                <surname>Gisselbrecht</surname>
              </persName>
              <email type="md5">4c1f1af668abea9586f87f717bb17653</email>
              <email type="domain">SNIPS.AI</email>
              <idno type="idhal" notation="numeric">1044395</idno>
              <idno type="halauthorid" notation="string">1052454-1044395</idno>
              <affiliation ref="#struct-543507"/>
            </author>
            <author role="aut">
              <persName>
                <forename type="first">Patrick</forename>
                <surname>Gallinari</surname>
              </persName>
              <email type="md5">d928d788b4143b63dbc87c6175a152be</email>
              <email type="domain">sorbonne-universite.fr</email>
              <idno type="idhal" notation="string">patrick-gallinari</idno>
              <idno type="idhal" notation="numeric">751615</idno>
              <idno type="halauthorid" notation="string">1778-751615</idno>
              <idno type="ORCID">https://orcid.org/0000-0001-9060-9001</idno>
              <idno type="IDREF">https://www.idref.fr/070709076</idno>
              <!-- Exactly one RESEARCHERID per author, given as the full profile URL. -->
              <idno type="RESEARCHERID">http://www.researcherid.com/rid/CSF-2807-2022</idno>
              <idno type="VIAF">https://viaf.org/viaf/6686337</idno>
              <!-- NOTE(review): no <org xml:id="struct-93591"> exists in this file's listOrg,
                   so this reference cannot be resolved locally; confirm against the HAL structure registry. -->
              <orgName ref="#struct-93591"/>
              <affiliation ref="#struct-541720"/>
            </author>
            <!-- Depositor: same name and email digest as the first author. -->
            <editor role="depositor">
              <persName>
                <forename>Sylvain</forename>
                <surname>Lamprier</surname>
              </persName>
              <email type="md5">942471cad263f780de2404e093709852</email>
              <email type="domain">yahoo.fr</email>
            </editor>
          </titleStmt>
          <!-- Version information for the deposit: a single edition "v1" marked type="current",
               followed by the contributor responsible for it. -->
          <editionStmt>
            <edition n="v1" type="current">
              <!-- The first three dates use a space-separated "YYYY-MM-DD hh:mm:ss" form with no
                   timezone designator (not the ISO 8601 "T" form); whenProduced carries only a year.
                   NOTE(review): timezone of these values is not stated anywhere in this file. -->
              <date type="whenSubmitted">2019-03-21 09:03:26</date>
              <date type="whenModified">2024-10-30 13:33:55</date>
              <date type="whenReleased">2019-03-21 09:03:26</date>
              <date type="whenProduced">2018</date>
            </edition>
            <respStmt>
              <resp>contributor</resp>
              <!-- key="143739" is an opaque identifier for the contributor; presumably a HAL user id (TODO confirm). -->
              <name key="143739">
                <persName>
                  <forename>Sylvain</forename>
                  <surname>Lamprier</surname>
                </persName>
                <email type="md5">942471cad263f780de2404e093709852</email>
                <email type="domain">yahoo.fr</email>
              </name>
            </respStmt>
          </editionStmt>
          <!-- Identifiers and citation strings for the record hal-02074907. -->
          <publicationStmt>
            <distributor>CCSD</distributor>
            <idno type="halId">hal-02074907</idno>
            <idno type="halUri">https://hal.sorbonne-universite.fr/hal-02074907</idno>
            <idno type="halBibtex">lamprier:hal-02074907</idno>
            <!-- halRefHtml is the same citation as halRef with the journal title wrapped in
                 entity-escaped <i> tags; a consumer must unescape it to obtain HTML. -->
            <idno type="halRefHtml">&lt;i&gt;Journal of Machine Learning Research&lt;/i&gt;, 2018, 19 (53), pp.53:1--53:40</idno>
            <idno type="halRef">Journal of Machine Learning Research, 2018, 19 (53), pp.53:1--53:40</idno>
            <!-- Empty availability element: only the status attribute is given, no licence child. -->
            <availability status="restricted"/>
          </publicationStmt>
          <!-- Collection stamps attached to the record. The n attribute is the stamp code and the
               element text its display label; corresp, where present, names another stamp code
               (presumably the parent collection; TODO confirm). -->
          <seriesStmt>
            <idno type="stamp" n="CNRS">CNRS - Centre national de la recherche scientifique</idno>
            <idno type="stamp" n="LIP6" corresp="SORBONNE-UNIVERSITE">Laboratoire d'Informatique de Paris 6</idno>
            <idno type="stamp" n="SORBONNE-UNIVERSITE">Sorbonne Université</idno>
            <idno type="stamp" n="SORBONNE-UNIV" corresp="SORBONNE-UNIVERSITE">Sorbonne Université 01/01/2018</idno>
            <idno type="stamp" n="SU-SCIENCES" corresp="SORBONNE-UNIVERSITE">Faculté des Sciences de Sorbonne Université</idno>
            <idno type="stamp" n="TEST-HALCNRS">Collection test HAL CNRS</idno>
            <!-- Label carries no leading whitespace, so exact-match and sorted consumers treat it like its siblings. -->
            <idno type="stamp" n="ALLIANCE-SU">Alliance Sorbonne Université</idno>
            <idno type="stamp" n="SUPRA_MATHS_INFO">Mathématiques + Informatique</idno>
          </seriesStmt>
          <!-- Record-level flags. Each note pairs a numeric code in the n attribute with a
               human-readable label as text (audience: 2 / International, popular: 0 / No, peer: 1 / Yes). -->
          <notesStmt>
            <note type="audience" n="2">International</note>
            <note type="popular" n="0">No</note>
            <note type="peer" n="1">Yes</note>
          </notesStmt>
          <!-- Structured citation of the published article: <analytic> describes the article and
               its authors (the same three people as in the record's titleStmt), <monogr> the journal
               and the volume/issue/pages it appeared in. -->
          <sourceDesc>
            <biblStruct>
              <analytic>
                <title xml:lang="en">Profile-Based Bandit with Unknown Profiles</title>
                <author role="aut">
                  <persName>
                    <forename type="first">Sylvain</forename>
                    <surname>Lamprier</surname>
                  </persName>
                  <email type="md5">942471cad263f780de2404e093709852</email>
                  <email type="domain">yahoo.fr</email>
                  <idno type="idhal" notation="string">sylvain-lamprier</idno>
                  <idno type="idhal" notation="numeric">740402</idno>
                  <idno type="halauthorid" notation="string">30958-740402</idno>
                  <idno type="ORCID">https://orcid.org/0000-0002-2508-922X</idno>
                  <idno type="IDREF">https://www.idref.fr/142632201</idno>
                  <idno type="ISNI">http://isni.org/isni/0000000140859141</idno>
                  <idno type="VIAF">https://viaf.org/viaf/200144138</idno>
                  <idno type="RESEARCHERID">http://www.researcherid.com/rid/DYO-1764-2022</idno>
                  <affiliation ref="#struct-541720"/>
                </author>
                <author role="aut">
                  <persName>
                    <forename type="first">Thibault</forename>
                    <surname>Gisselbrecht</surname>
                  </persName>
                  <email type="md5">4c1f1af668abea9586f87f717bb17653</email>
                  <email type="domain">SNIPS.AI</email>
                  <idno type="idhal" notation="numeric">1044395</idno>
                  <idno type="halauthorid" notation="string">1052454-1044395</idno>
                  <affiliation ref="#struct-543507"/>
                </author>
                <author role="aut">
                  <persName>
                    <forename type="first">Patrick</forename>
                    <surname>Gallinari</surname>
                  </persName>
                  <email type="md5">d928d788b4143b63dbc87c6175a152be</email>
                  <email type="domain">sorbonne-universite.fr</email>
                  <idno type="idhal" notation="string">patrick-gallinari</idno>
                  <idno type="idhal" notation="numeric">751615</idno>
                  <idno type="halauthorid" notation="string">1778-751615</idno>
                  <idno type="ORCID">https://orcid.org/0000-0001-9060-9001</idno>
                  <idno type="IDREF">https://www.idref.fr/070709076</idno>
                  <!-- Exactly one RESEARCHERID per author, given as the full profile URL. -->
                  <idno type="RESEARCHERID">http://www.researcherid.com/rid/CSF-2807-2022</idno>
                  <idno type="VIAF">https://viaf.org/viaf/6686337</idno>
                  <!-- NOTE(review): no <org xml:id="struct-93591"> exists in this file's listOrg,
                       so this reference cannot be resolved locally; confirm against the HAL structure registry. -->
                  <orgName ref="#struct-93591"/>
                  <affiliation ref="#struct-541720"/>
                </author>
              </analytic>
              <monogr>
                <!-- Journal identifiers: a HAL-internal journal id plus print and electronic ISSN. -->
                <idno type="halJournalId" status="VALID">1472</idno>
                <idno type="issn">1532-4435</idno>
                <idno type="eissn">1533-7928</idno>
                <title level="j">Journal of Machine Learning Research</title>
                <imprint>
                  <publisher>Microtome Publishing</publisher>
                  <biblScope unit="volume">19</biblScope>
                  <biblScope unit="issue">53</biblScope>
                  <!-- Page range is stored as free text in "paper:page" form with a doubled hyphen as the
                       range separator; consumers should not expect a plain numeric range here. -->
                  <biblScope unit="pp">53:1--53:40</biblScope>
                  <date type="datePub">2018</date>
                </imprint>
              </monogr>
            </biblStruct>
          </sourceDesc>
          <!-- Language, classification codes and abstract of the article. -->
          <profileDesc>
            <langUsage>
              <language ident="en">English</language>
            </langUsage>
            <textClass>
              <!-- scheme selects the vocabulary, n is the code within it, the text is the display label.
                   All three typology schemes carry the same code (ART) for this record. -->
              <classCode scheme="halDomain" n="info.info-ai">Computer Science [cs]/Artificial Intelligence [cs.AI]</classCode>
              <classCode scheme="halTypology" n="ART">Journal articles</classCode>
              <classCode scheme="halOldTypology" n="ART">Journal articles</classCode>
              <classCode scheme="halTreeTypology" n="ART">Journal articles</classCode>
            </textClass>
            <!-- The abstract is plain text that still contains LaTeX markup (\textit{...});
                 renderers must handle or strip it themselves. -->
            <abstract xml:lang="en">
              <p>Stochastic bandits have been widely studied since decades. A very large panel of settings have been introduced, some of them for the inclusion of some structure between actions. If actions are associated with feature vectors that underlie their usefulness, the discovery of a mapping parameter between such profiles and rewards can help the exploration process of the bandit strategies. This is the setting studied in this paper, but in our case the action profiles (constant feature vectors) are unknown beforehand. Instead, the agent is only given sample vectors, with mean centered on the true profiles, for a subset of actions at each step of the process. In this new bandit instance, policies have thus to deal with a doubled uncertainty, both on the profile estimators and the reward mapping parameters learned so far. We propose a new algorithm, called \textit{SampLinUCB}, specifically designed for this case. Theoretical convergence guarantees are given for this strategy, according to various profile samples delivery scenarios. Finally, experiments are conducted on both artificial data and a task of focused data capture from online social networks. Obtained results demonstrate the relevance of the approach in various settings.</p>
            </abstract>
          </profileDesc>
        </biblFull>
      </listBibl>
    </body>
    <back>
      <listOrg type="structures">
        <!-- Research team MLIA, referenced by two of the three authors' <affiliation> elements.
             status="OLD" and an end date are present, i.e. the structure is recorded as closed. -->
        <org type="researchteam" xml:id="struct-541720" status="OLD">
          <orgName>Machine Learning and Information Access</orgName>
          <orgName type="acronym">MLIA</orgName>
          <date type="start">2018-01-01</date>
          <date type="end">2021-12-31</date>
          <desc>
            <address>
              <country key="FR"/>
            </address>
          </desc>
          <!-- Links to other <org> entries in this list: one "direct" relation (struct-541703)
               and two "indirect" ones; the name attribute on the last carries the code UMR7606. -->
          <listRelation>
            <relation active="#struct-541703" type="direct"/>
            <relation active="#struct-413221" type="indirect"/>
            <relation name="UMR7606" active="#struct-441569" type="indirect"/>
          </listRelation>
        </org>
        <!-- Institution SNIPS, referenced by the second author's <affiliation>.
             It has no identifiers, dates or relations; status is "INCOMING"
             (presumably not yet validated in the HAL registry; TODO confirm). -->
        <org type="institution" xml:id="struct-543507" status="INCOMING">
          <orgName>SNIPS</orgName>
          <desc>
            <address>
              <addrLine>Paris</addrLine>
              <country key="FR"/>
            </address>
          </desc>
        </org>
        <!-- Laboratory LIP6: the "direct" relation target of the MLIA team (struct-541720). -->
        <org type="laboratory" xml:id="struct-541703" status="VALID">
          <!-- External identifiers are bare codes here, except ROR which is a full URL.
               Note the type is spelled "IdRef" on organisations but "IDREF" on authors. -->
          <idno type="IdRef">13558292X</idno>
          <idno type="RNSR">199712651U</idno>
          <idno type="ROR">https://ror.org/05krcen59</idno>
          <orgName>LIP6</orgName>
          <date type="start">2018-01-01</date>
          <desc>
            <address>
              <addrLine>4 Place JUSSIEU 75252 PARIS CEDEX 05</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">http://www.lip6.fr/</ref>
          </desc>
          <!-- Both relations are "direct": to struct-413221 and, under the code UMR7606, to struct-441569. -->
          <listRelation>
            <relation active="#struct-413221" type="direct"/>
            <relation name="UMR7606" active="#struct-441569" type="direct"/>
          </listRelation>
        </org>
        <!-- Sorbonne Université (SU): relation target of both the MLIA team and LIP6.
             It declares no relations of its own. -->
        <org type="regroupinstitution" xml:id="struct-413221" status="VALID">
          <idno type="IdRef">221333754</idno>
          <idno type="ROR">https://ror.org/02en5vm52</idno>
          <orgName>Sorbonne Université</orgName>
          <orgName type="acronym">SU</orgName>
          <date type="start">2018-01-01</date>
          <desc>
            <address>
              <addrLine>21 rue de l’École de médecine - 75006 Paris</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">http://www.sorbonne-universite.fr/</ref>
          </desc>
        </org>
        <!-- CNRS: the structure that the MLIA team and LIP6 relate to under the code UMR7606.
             The address holds only a country key; no address line is given. -->
        <org type="regroupinstitution" xml:id="struct-441569" status="VALID">
          <idno type="IdRef">02636817X</idno>
          <!-- ISNI is a bare 16-digit code here, whereas author ISNI values elsewhere in the file are full URLs. -->
          <idno type="ISNI">0000000122597504</idno>
          <idno type="ROR">https://ror.org/02feahw73</idno>
          <orgName>Centre National de la Recherche Scientifique</orgName>
          <orgName type="acronym">CNRS</orgName>
          <date type="start">1939-10-19</date>
          <desc>
            <address>
              <country key="FR"/>
            </address>
            <ref type="url">https://www.cnrs.fr/</ref>
          </desc>
        </org>
      </listOrg>
    </back>
  </text>
</TEI>