<?xml version="1.0" encoding="utf-8"?>
<TEI xmlns="http://www.tei-c.org/ns/1.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:hal="http://hal.archives-ouvertes.fr/" xmlns:gml="http://www.opengis.net/gml/3.3/" xmlns:gmlce="http://www.opengis.net/gml/3.3/ce" version="1.1" xsi:schemaLocation="http://www.tei-c.org/ns/1.0 http://api.archives-ouvertes.fr/documents/aofr-sword.xsd">
  <teiHeader>
    <fileDesc>
      <titleStmt>
        <title>HAL TEI export of hal-02063698</title>
      </titleStmt>
      <publicationStmt>
        <distributor>CCSD</distributor>
        <availability status="restricted">
          <licence target="https://creativecommons.org/publicdomain/zero/1.0/">CC0 1.0 - Universal</licence>
        </availability>
        <date when="2026-05-23T13:56:17+02:00"/>
      </publicationStmt>
      <sourceDesc>
        <p part="N">HAL API Platform</p>
      </sourceDesc>
    </fileDesc>
  </teiHeader>
  <text>
    <body>
      <listBibl>
        <biblFull>
          <titleStmt>
            <title xml:lang="en">STOCHASTIC ADAPTIVE NEURAL ARCHITECTURE SEARCH FOR KEYWORD SPOTTING</title>
            <author role="aut">
              <persName>
                <forename type="first">Tom</forename>
                <surname>Véniat</surname>
              </persName>
              <email type="md5">9c9dda806e8c6cd7353f21a2a39e06d2</email>
              <email type="domain">lip6.fr</email>
              <idno type="idhal" notation="string">tom-veniat</idno>
              <idno type="idhal" notation="numeric">739051</idno>
              <idno type="halauthorid" notation="string">43953-739051</idno>
              <affiliation ref="#struct-541720"/>
            </author>
            <author role="aut">
              <persName>
                <forename type="first">Olivier</forename>
                <surname>Schwander</surname>
              </persName>
              <email type="md5">a40e1af959388c622090dcdda0f5b453</email>
              <email type="domain">sorbonne-universite.fr</email>
              <idno type="idhal" notation="string">olivier-schwander</idno>
              <idno type="idhal" notation="numeric">14377</idno>
              <idno type="halauthorid" notation="string">24156-14377</idno>
              <idno type="ORCID">https://orcid.org/0000-0003-0266-1585</idno>
              <idno type="IDREF">https://www.idref.fr/178639419</idno>
              <affiliation ref="#struct-541720"/>
            </author>
            <author role="aut">
              <persName>
                <forename type="first">Ludovic</forename>
                <surname>Denoyer</surname>
              </persName>
              <email type="md5">5a966f98d3670909f62ad2f0e0a0ec3f</email>
              <email type="domain">lip6.fr</email>
              <idno type="idhal" notation="string">ludovic-denoyer</idno>
              <idno type="idhal" notation="numeric">9178</idno>
              <idno type="halauthorid" notation="string">5171-9178</idno>
              <idno type="ORCID">https://orcid.org/0000-0002-7348-788X</idno>
              <idno type="IDREF">https://www.idref.fr/089291255</idno>
              <orgName ref="#struct-93591"/>
              <affiliation ref="#struct-541720"/>
              <affiliation ref="#struct-267305"/>
            </author>
            <editor role="depositor">
              <persName>
                <forename>Olivier</forename>
                <surname>Schwander</surname>
              </persName>
              <email type="md5">a40e1af959388c622090dcdda0f5b453</email>
              <email type="domain">sorbonne-universite.fr</email>
            </editor>
            <funder ref="#projanr-41957"/>
          </titleStmt>
          <editionStmt>
            <edition n="v1" type="current">
              <date type="whenSubmitted">2019-03-11 13:49:44</date>
              <date type="whenModified">2024-10-30 13:33:03</date>
              <date type="whenReleased">2019-03-21 16:26:51</date>
              <date type="whenProduced">2019-05-12</date>
              <date type="whenEndEmbargoed">2019-03-11</date>
              <ref type="file" target="https://hal.sorbonne-universite.fr/hal-02063698v1/document">
                <date notBefore="2019-03-11"/>
              </ref>
              <ref type="file" subtype="author" n="1" target="https://hal.sorbonne-universite.fr/hal-02063698v1/file/ICASSP_2019.pdf" id="file-2063698-2066577">
                <date notBefore="2019-03-11"/>
              </ref>
              <ref type="externalLink" target="http://arxiv.org/pdf/1811.06753"/>
            </edition>
            <respStmt>
              <resp>contributor</resp>
              <name key="190533">
                <persName>
                  <forename>Olivier</forename>
                  <surname>Schwander</surname>
                </persName>
                <email type="md5">a40e1af959388c622090dcdda0f5b453</email>
                <email type="domain">sorbonne-universite.fr</email>
              </name>
            </respStmt>
          </editionStmt>
          <publicationStmt>
            <distributor>CCSD</distributor>
            <idno type="halId">hal-02063698</idno>
            <idno type="halUri">https://hal.sorbonne-universite.fr/hal-02063698</idno>
            <idno type="halBibtex">veniat:hal-02063698</idno>
            <idno type="halRefHtml">&lt;i&gt;ICASSP 2019 - International Conference on Acoustics, Speech, and Signal Processing&lt;/i&gt;, May 2019, Brighton, United Kingdom</idno>
            <idno type="halRef">ICASSP 2019 - International Conference on Acoustics, Speech, and Signal Processing, May 2019, Brighton, United Kingdom</idno>
            <availability status="restricted">
              <licence target="https://about.hal.science/hal-authorisation-v1/">HAL Authorization<ref corresp="#file-2063698-2066577"/></licence>
            </availability>
          </publicationStmt>
          <seriesStmt>
            <idno type="stamp" n="CNRS">CNRS - Centre national de la recherche scientifique</idno>
            <idno type="stamp" n="LIP6" corresp="SORBONNE-UNIVERSITE">Laboratoire d'Informatique de Paris 6</idno>
            <idno type="stamp" n="SORBONNE-UNIVERSITE">Sorbonne Université</idno>
            <idno type="stamp" n="SORBONNE-UNIV" corresp="SORBONNE-UNIVERSITE">Sorbonne Université 01/01/2018</idno>
            <idno type="stamp" n="SU-SCIENCES" corresp="SORBONNE-UNIVERSITE">Faculté des Sciences de Sorbonne Université</idno>
            <idno type="stamp" n="TEST-HALCNRS">Collection test HAL CNRS</idno>
            <idno type="stamp" n="SU-TI">Sorbonne Université - Texte Intégral</idno>
            <idno type="stamp" n="ANR">ANR</idno>
            <idno type="stamp" n="ALLIANCE-SU"> Alliance Sorbonne Université</idno>
            <idno type="stamp" n="SUPRA_MATHS_INFO">Mathématiques + Informatique</idno>
          </seriesStmt>
          <notesStmt>
            <note type="audience" n="2">International</note>
            <note type="invited" n="0">No</note>
            <note type="popular" n="0">No</note>
            <note type="peer" n="1">Yes</note>
            <note type="proceedings" n="0">No</note>
          </notesStmt>
          <sourceDesc>
            <biblStruct>
              <analytic>
                <title xml:lang="en">STOCHASTIC ADAPTIVE NEURAL ARCHITECTURE SEARCH FOR KEYWORD SPOTTING</title>
                <author role="aut">
                  <persName>
                    <forename type="first">Tom</forename>
                    <surname>Véniat</surname>
                  </persName>
                  <email type="md5">9c9dda806e8c6cd7353f21a2a39e06d2</email>
                  <email type="domain">lip6.fr</email>
                  <idno type="idhal" notation="string">tom-veniat</idno>
                  <idno type="idhal" notation="numeric">739051</idno>
                  <idno type="halauthorid" notation="string">43953-739051</idno>
                  <affiliation ref="#struct-541720"/>
                </author>
                <author role="aut">
                  <persName>
                    <forename type="first">Olivier</forename>
                    <surname>Schwander</surname>
                  </persName>
                  <email type="md5">a40e1af959388c622090dcdda0f5b453</email>
                  <email type="domain">sorbonne-universite.fr</email>
                  <idno type="idhal" notation="string">olivier-schwander</idno>
                  <idno type="idhal" notation="numeric">14377</idno>
                  <idno type="halauthorid" notation="string">24156-14377</idno>
                  <idno type="ORCID">https://orcid.org/0000-0003-0266-1585</idno>
                  <idno type="IDREF">https://www.idref.fr/178639419</idno>
                  <affiliation ref="#struct-541720"/>
                </author>
                <author role="aut">
                  <persName>
                    <forename type="first">Ludovic</forename>
                    <surname>Denoyer</surname>
                  </persName>
                  <email type="md5">5a966f98d3670909f62ad2f0e0a0ec3f</email>
                  <email type="domain">lip6.fr</email>
                  <idno type="idhal" notation="string">ludovic-denoyer</idno>
                  <idno type="idhal" notation="numeric">9178</idno>
                  <idno type="halauthorid" notation="string">5171-9178</idno>
                  <idno type="ORCID">https://orcid.org/0000-0002-7348-788X</idno>
                  <idno type="IDREF">https://www.idref.fr/089291255</idno>
                  <orgName ref="#struct-93591"/>
                  <affiliation ref="#struct-541720"/>
                  <affiliation ref="#struct-267305"/>
                </author>
              </analytic>
              <monogr>
                <meeting>
                  <title>ICASSP 2019 - International Conference on Acoustics, Speech, and Signal Processing</title>
                  <date type="start">2019-05-12</date>
                  <date type="end">2019-05-17</date>
                  <settlement>Brighton</settlement>
                  <country key="GB">United Kingdom</country>
                </meeting>
                <imprint>
                  <date type="datePub">2019</date>
                </imprint>
              </monogr>
              <idno type="arxiv">1811.06753</idno>
            </biblStruct>
          </sourceDesc>
          <profileDesc>
            <langUsage>
              <language ident="en">English</language>
            </langUsage>
            <textClass>
              <keywords scheme="author">
                <term xml:lang="en">Budgeted Learning</term>
                <term xml:lang="en">Deep Learning</term>
                <term xml:lang="en">Keyword Spotting</term>
                <term xml:lang="en">Neural Architecture Search</term>
              </keywords>
              <classCode scheme="halDomain" n="info.info-lg">Computer Science [cs]/Machine Learning [cs.LG]</classCode>
              <classCode scheme="halDomain" n="info.info-ai">Computer Science [cs]/Artificial Intelligence [cs.AI]</classCode>
              <classCode scheme="halDomain" n="info.info-ts">Computer Science [cs]/Signal and Image Processing</classCode>
              <classCode scheme="halTypology" n="COMM">Conference papers</classCode>
              <classCode scheme="halOldTypology" n="COMM">Conference papers</classCode>
              <classCode scheme="halTreeTypology" n="COMM">Conference papers</classCode>
            </textClass>
            <abstract xml:lang="en">
              <p>The problem of keyword spotting i.e. identifying keywords in a real-time audio stream is mainly solved by applying a neural network over successive sliding windows. Due to the difficulty of the task, baseline models are usually large, resulting in a high computational cost and energy consumption level. We propose a new method called SANAS (Stochastic Adaptive Neural Architecture Search) which is able to adapt the architecture of the neural network on-the-fly at inference time such that small architectures will be used when the stream is easy to process (silence, low noise, ...) and bigger networks will be used when the task becomes more difficult. We show that this adaptive model can be learned end-to-end by optimizing a trade-off between the prediction performance and the average computational cost per unit of time. Experiments on the Speech Commands dataset [1] show that this approach leads to a high recognition level while being much faster (and/or energy saving) than classical approaches where the network architecture is static.</p>
            </abstract>
          </profileDesc>
        </biblFull>
      </listBibl>
    </body>
    <back>
      <listOrg type="structures">
        <org type="researchteam" xml:id="struct-541720" status="OLD">
          <orgName>Machine Learning and Information Access</orgName>
          <orgName type="acronym">MLIA</orgName>
          <date type="start">2018-01-01</date>
          <date type="end">2021-12-31</date>
          <desc>
            <address>
              <country key="FR"/>
            </address>
          </desc>
          <listRelation>
            <relation active="#struct-541703" type="direct"/>
            <relation active="#struct-413221" type="indirect"/>
            <relation name="UMR7606" active="#struct-441569" type="indirect"/>
          </listRelation>
        </org>
        <org type="laboratory" xml:id="struct-267305" status="VALID">
          <orgName>Facebook AI Research [Paris]</orgName>
          <orgName type="acronym">FAIR</orgName>
          <desc>
            <address>
              <addrLine>Paris</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">https://research.facebook.com/ai</ref>
          </desc>
          <listRelation>
            <relation active="#struct-332252" type="direct"/>
          </listRelation>
        </org>
        <org type="laboratory" xml:id="struct-541703" status="VALID">
          <idno type="IdRef">13558292X</idno>
          <idno type="RNSR">199712651U</idno>
          <idno type="ROR">https://ror.org/05krcen59</idno>
          <orgName>LIP6</orgName>
          <date type="start">2018-01-01</date>
          <desc>
            <address>
              <addrLine>4 Place JUSSIEU 75252 PARIS CEDEX 05</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">http://www.lip6.fr/</ref>
          </desc>
          <listRelation>
            <relation active="#struct-413221" type="direct"/>
            <relation name="UMR7606" active="#struct-441569" type="direct"/>
          </listRelation>
        </org>
        <org type="regroupinstitution" xml:id="struct-413221" status="VALID">
          <idno type="IdRef">221333754</idno>
          <idno type="ROR">https://ror.org/02en5vm52</idno>
          <orgName>Sorbonne Université</orgName>
          <orgName type="acronym">SU</orgName>
          <date type="start">2018-01-01</date>
          <desc>
            <address>
              <addrLine>21 rue de l’École de médecine - 75006 Paris</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">http://www.sorbonne-universite.fr/</ref>
          </desc>
        </org>
        <org type="regroupinstitution" xml:id="struct-441569" status="VALID">
          <idno type="IdRef">02636817X</idno>
          <idno type="ISNI">0000000122597504</idno>
          <idno type="ROR">https://ror.org/02feahw73</idno>
          <orgName>Centre National de la Recherche Scientifique</orgName>
          <orgName type="acronym">CNRS</orgName>
          <date type="start">1939-10-19</date>
          <desc>
            <address>
              <country key="FR"/>
            </address>
            <ref type="url">https://www.cnrs.fr/</ref>
          </desc>
        </org>
        <org type="institution" xml:id="struct-332252" status="VALID">
          <orgName>Facebook</orgName>
          <desc>
            <address>
              <country key="US"/>
            </address>
          </desc>
        </org>
      </listOrg>
      <listOrg type="projects">
        <org type="anrProject" xml:id="projanr-41957" status="VALID">
          <idno type="anr">ANR-16-CE23-0016</idno>
          <orgName>PAMELA</orgName>
          <desc>Apprentissage automatique décentralisé et personnalisé sous contraintes</desc>
          <date type="start">2016</date>
        </org>
      </listOrg>
    </back>
  </text>
</TEI>