<?xml version="1.0" encoding="utf-8"?>
<TEI xmlns="http://www.tei-c.org/ns/1.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:hal="http://hal.archives-ouvertes.fr/" xmlns:gml="http://www.opengis.net/gml/3.3/" xmlns:gmlce="http://www.opengis.net/gml/3.3/ce" version="1.1" xsi:schemaLocation="http://www.tei-c.org/ns/1.0 http://api.archives-ouvertes.fr/documents/aofr-sword.xsd">
  <teiHeader>
    <fileDesc>
      <titleStmt>
        <title>HAL TEI export of hal-04842482</title>
      </titleStmt>
      <publicationStmt>
        <distributor>CCSD</distributor>
        <availability status="restricted">
          <licence target="https://creativecommons.org/publicdomain/zero/1.0/">CC0 1.0 - Universal</licence>
        </availability>
        <date when="2026-05-22T23:57:51+02:00"/>
      </publicationStmt>
      <sourceDesc>
        <p part="N">HAL API Platform</p>
      </sourceDesc>
    </fileDesc>
  </teiHeader>
  <text>
    <body>
      <listBibl>
        <biblFull>
          <titleStmt>
            <title xml:lang="en">ANTM: Aligned Neural Topic Models for Exploring Evolving Topics</title>
            <author role="aut">
              <persName>
                <forename type="first">Hamed</forename>
                <surname>Rahimi</surname>
              </persName>
              <email type="md5">30a83cb3dc6d0bfb308c36d0da56b632</email>
              <email type="domain">isir.upmc.fr</email>
              <idno type="idhal" notation="numeric">1505243</idno>
              <idno type="halauthorid" notation="string">2020742-1505243</idno>
              <idno type="IDREF">https://www.idref.fr/283103159</idno>
              <idno type="ORCID">https://orcid.org/0000-0001-9179-8625</idno>
              <affiliation ref="#struct-541715"/>
            </author>
            <author role="aut">
              <persName>
                <forename type="first">Hubert</forename>
                <surname>Naacke</surname>
              </persName>
              <email type="md5">fb2112a843a757bff27e0398b762ba0b</email>
              <email type="domain">lip6.fr</email>
              <idno type="idhal" notation="string">hubert-naacke</idno>
              <idno type="idhal" notation="numeric">9627</idno>
              <idno type="halauthorid" notation="string">9851-9627</idno>
              <idno type="ORCID">https://orcid.org/0000-0003-0559-9908</idno>
              <idno type="IDREF">https://www.idref.fr/06104203X</idno>
              <affiliation ref="#struct-541715"/>
            </author>
            <author role="aut">
              <persName>
                <forename type="first">Camelia</forename>
                <surname>Constantin</surname>
              </persName>
              <idno type="halauthorid">17775-0</idno>
              <affiliation ref="#struct-541715"/>
            </author>
            <author role="aut">
              <persName>
                <forename type="first">Bernd</forename>
                <surname>Amann</surname>
              </persName>
              <email type="md5">5ffc73d3de10460ec80fc861c8f18e8f</email>
              <email type="domain">lip6.fr</email>
              <idno type="idhal" notation="string">bernd-amann</idno>
              <idno type="idhal" notation="numeric">3057</idno>
              <idno type="halauthorid" notation="string">13288-3057</idno>
              <idno type="ORCID">https://orcid.org/0000-0002-6822-4049</idno>
              <idno type="GOOGLE SCHOLAR">https://scholar.google.com/citations?user=jKHvF80AAAAJ&amp;hl=en</idno>
              <idno type="IDREF">https://www.idref.fr/060259418</idno>
              <affiliation ref="#struct-541715"/>
            </author>
            <editor role="depositor">
              <persName>
                <forename>Bernd</forename>
                <surname>Amann</surname>
              </persName>
              <email type="md5">5ffc73d3de10460ec80fc861c8f18e8f</email>
              <email type="domain">lip6.fr</email>
            </editor>
            <funder>SCAI - Sorbonne Université</funder>
          </titleStmt>
          <editionStmt>
            <edition n="v1" type="current">
              <date type="whenSubmitted">2024-12-17 10:58:29</date>
              <date type="whenModified">2025-10-11 15:34:29</date>
              <date type="whenReleased">2024-12-17 10:58:29</date>
              <date type="whenProduced">2024-07-21</date>
            </edition>
            <respStmt>
              <resp>contributor</resp>
              <name key="192637">
                <persName>
                  <forename>Bernd</forename>
                  <surname>Amann</surname>
                </persName>
                <email type="md5">5ffc73d3de10460ec80fc861c8f18e8f</email>
                <email type="domain">lip6.fr</email>
              </name>
            </respStmt>
          </editionStmt>
          <publicationStmt>
            <distributor>CCSD</distributor>
            <idno type="halId">hal-04842482</idno>
            <idno type="halUri">https://hal.sorbonne-universite.fr/hal-04842482</idno>
            <idno type="halBibtex">rahimi:hal-04842482</idno>
            <idno type="halRefHtml">Abdelkader Hameurlain; A Min Tjoa; Reza Akbarinia; Angela Bonifati. &lt;i&gt;Transactions on Large-Scale Data- and Knowledge-Centered Systems LVI: Special Issue on Data Management - Principles, Technologies, and Applications&lt;/i&gt;, 14790, Springer Berlin Heidelberg, pp.76-97, 2024, Lecture Notes in Computer Science (TLDKS), 978-3-662-69603-3. &lt;a target="_blank" href="https://dx.doi.org/10.1007/978-3-662-69603-3_3"&gt;&amp;#x27E8;10.1007/978-3-662-69603-3_3&amp;#x27E9;&lt;/a&gt;</idno>
            <idno type="halRef">Abdelkader Hameurlain; A Min Tjoa; Reza Akbarinia; Angela Bonifati. Transactions on Large-Scale Data- and Knowledge-Centered Systems LVI: Special Issue on Data Management - Principles, Technologies, and Applications, 14790, Springer Berlin Heidelberg, pp.76-97, 2024, Lecture Notes in Computer Science (TLDKS), 978-3-662-69603-3. &amp;#x27E8;10.1007/978-3-662-69603-3_3&amp;#x27E9;</idno>
            <availability status="restricted"/>
          </publicationStmt>
          <seriesStmt>
            <idno type="stamp" n="CNRS">CNRS - Centre national de la recherche scientifique</idno>
            <idno type="stamp" n="LIP6" corresp="SORBONNE-UNIVERSITE">Laboratoire d'Informatique de Paris 6</idno>
            <idno type="stamp" n="SORBONNE-UNIVERSITE">Sorbonne Université</idno>
            <idno type="stamp" n="SORBONNE-UNIV" corresp="SORBONNE-UNIVERSITE">Sorbonne Université 01/01/2018</idno>
            <idno type="stamp" n="SU-SCIENCES" corresp="SORBONNE-UNIVERSITE">Faculté des Sciences de Sorbonne Université</idno>
            <idno type="stamp" n="ALLIANCE-SU"> Alliance Sorbonne Université</idno>
            <idno type="stamp" n="SUPRA_MATHS_INFO">Mathématiques + Informatique</idno>
          </seriesStmt>
          <notesStmt>
            <note type="audience" n="2">International</note>
            <note type="popular" n="0">No</note>
          </notesStmt>
          <sourceDesc>
            <biblStruct>
              <analytic>
                <title xml:lang="en">ANTM: Aligned Neural Topic Models for Exploring Evolving Topics</title>
                <author role="aut">
                  <persName>
                    <forename type="first">Hamed</forename>
                    <surname>Rahimi</surname>
                  </persName>
                  <email type="md5">30a83cb3dc6d0bfb308c36d0da56b632</email>
                  <email type="domain">isir.upmc.fr</email>
                  <idno type="idhal" notation="numeric">1505243</idno>
                  <idno type="halauthorid" notation="string">2020742-1505243</idno>
                  <idno type="IDREF">https://www.idref.fr/283103159</idno>
                  <idno type="ORCID">https://orcid.org/0000-0001-9179-8625</idno>
                  <affiliation ref="#struct-541715"/>
                </author>
                <author role="aut">
                  <persName>
                    <forename type="first">Hubert</forename>
                    <surname>Naacke</surname>
                  </persName>
                  <email type="md5">fb2112a843a757bff27e0398b762ba0b</email>
                  <email type="domain">lip6.fr</email>
                  <idno type="idhal" notation="string">hubert-naacke</idno>
                  <idno type="idhal" notation="numeric">9627</idno>
                  <idno type="halauthorid" notation="string">9851-9627</idno>
                  <idno type="ORCID">https://orcid.org/0000-0003-0559-9908</idno>
                  <idno type="IDREF">https://www.idref.fr/06104203X</idno>
                  <affiliation ref="#struct-541715"/>
                </author>
                <author role="aut">
                  <persName>
                    <forename type="first">Camelia</forename>
                    <surname>Constantin</surname>
                  </persName>
                  <idno type="halauthorid">17775-0</idno>
                  <affiliation ref="#struct-541715"/>
                </author>
                <author role="aut">
                  <persName>
                    <forename type="first">Bernd</forename>
                    <surname>Amann</surname>
                  </persName>
                  <email type="md5">5ffc73d3de10460ec80fc861c8f18e8f</email>
                  <email type="domain">lip6.fr</email>
                  <idno type="idhal" notation="string">bernd-amann</idno>
                  <idno type="idhal" notation="numeric">3057</idno>
                  <idno type="halauthorid" notation="string">13288-3057</idno>
                  <idno type="ORCID">https://orcid.org/0000-0002-6822-4049</idno>
                  <idno type="GOOGLE SCHOLAR">https://scholar.google.com/citations?user=jKHvF80AAAAJ&amp;hl=en</idno>
                  <idno type="IDREF">https://www.idref.fr/060259418</idno>
                  <affiliation ref="#struct-541715"/>
                </author>
              </analytic>
              <monogr>
                <idno type="isbn">978-3-662-69603-3</idno>
                <title level="m">Transactions on Large-Scale Data- and Knowledge-Centered Systems LVI: Special Issue on Data Management - Principles, Technologies, and Applications</title>
                <editor>Abdelkader Hameurlain</editor>
                <editor>A Min Tjoa</editor>
                <editor>Reza Akbarinia</editor>
                <editor>Angela Bonifati</editor>
                <imprint>
                  <publisher>Springer Berlin Heidelberg</publisher>
                  <pubPlace>Berlin, Heidelberg</pubPlace>
                  <biblScope unit="serie">Lecture Notes in Computer Science (TLDKS)</biblScope>
                  <biblScope unit="volume">14790</biblScope>
                  <biblScope unit="pp">76-97</biblScope>
                  <date type="datePub">2024-07-21</date>
                </imprint>
              </monogr>
              <idno type="doi">10.1007/978-3-662-69603-3_3</idno>
            </biblStruct>
          </sourceDesc>
          <profileDesc>
            <langUsage>
              <language ident="en">English</language>
            </langUsage>
            <textClass>
              <keywords scheme="author">
                <term xml:lang="en">Topic modelling</term>
                <term xml:lang="en">Text Analysis</term>
                <term xml:lang="en">Archive documents</term>
                <term xml:lang="en">Science evolution</term>
              </keywords>
              <classCode scheme="halDomain" n="info.info-db">Computer Science [cs]/Databases [cs.DB]</classCode>
              <classCode scheme="halDomain" n="info.info-tt">Computer Science [cs]/Document and Text Processing</classCode>
              <classCode scheme="halTypology" n="COUV">Book sections</classCode>
              <classCode scheme="halOldTypology" n="COUV">Book sections</classCode>
              <classCode scheme="halTreeTypology" n="COUV">Book sections</classCode>
            </textClass>
            <abstract xml:lang="en">
              <p>In today’s world, where the amount of textual information generated by humans and machines is rapidly growing, computational methods for organizing, summarizing, and tracking textual information and its evolution are becoming increasingly important. This paper introduces ANTM, an algorithmic family of dynamic topic models that combines novel techniques for discovering evolving topics in large corpora. ANTM preserves the temporal continuity of evolving topics by extracting temporal features from documents with advanced pre-trained large language models and by employing an overlapping sliding window algorithm for sequential aligned document clustering. This clustering method identifies different numbers of topics within each time frame and aligns semantically similar document clusters across time periods. It captures emerging and fading topics over time and allows for a more diverse and coherent representation of evolving topics. We evaluate ANTM against four other dynamic topic models on three datasets and conclude that it outperforms the state-of-the-art approaches in terms of interpretability and diversity. Furthermore, we demonstrate its effectiveness in handling large corpora, while improving the scalability and adaptability of dynamic topic models to different domains.</p>
            </abstract>
          </profileDesc>
        </biblFull>
      </listBibl>
    </body>
    <back>
      <listOrg type="structures">
        <org type="researchteam" xml:id="struct-541715" status="VALID">
          <orgName>Bases de Données</orgName>
          <orgName type="acronym">BD</orgName>
          <date type="start">2008-01-01</date>
          <desc>
            <address>
              <country key="FR"/>
            </address>
          </desc>
          <listRelation>
            <relation active="#struct-541703" type="direct"/>
            <relation active="#struct-413221" type="indirect"/>
            <relation name="UMR7606" active="#struct-441569" type="indirect"/>
          </listRelation>
        </org>
        <org type="laboratory" xml:id="struct-541703" status="VALID">
          <idno type="IdRef">13558292X</idno>
          <idno type="RNSR">199712651U</idno>
          <idno type="ROR">https://ror.org/05krcen59</idno>
          <orgName>LIP6</orgName>
          <date type="start">2018-01-01</date>
          <desc>
            <address>
              <addrLine>4 Place JUSSIEU 75252 PARIS CEDEX 05</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">http://www.lip6.fr/</ref>
          </desc>
          <listRelation>
            <relation active="#struct-413221" type="direct"/>
            <relation name="UMR7606" active="#struct-441569" type="direct"/>
          </listRelation>
        </org>
        <org type="regroupinstitution" xml:id="struct-413221" status="VALID">
          <idno type="IdRef">221333754</idno>
          <idno type="ROR">https://ror.org/02en5vm52</idno>
          <orgName>Sorbonne Université</orgName>
          <orgName type="acronym">SU</orgName>
          <date type="start">2018-01-01</date>
          <desc>
            <address>
              <addrLine>21 rue de l’École de médecine - 75006 Paris</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">http://www.sorbonne-universite.fr/</ref>
          </desc>
        </org>
        <org type="regroupinstitution" xml:id="struct-441569" status="VALID">
          <idno type="IdRef">02636817X</idno>
          <idno type="ISNI">0000000122597504</idno>
          <idno type="ROR">https://ror.org/02feahw73</idno>
          <orgName>Centre National de la Recherche Scientifique</orgName>
          <orgName type="acronym">CNRS</orgName>
          <date type="start">1939-10-19</date>
          <desc>
            <address>
              <country key="FR"/>
            </address>
            <ref type="url">https://www.cnrs.fr/</ref>
          </desc>
        </org>
      </listOrg>
    </back>
  </text>
</TEI>