<?xml version="1.0" encoding="utf-8"?>
<TEI xmlns="http://www.tei-c.org/ns/1.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:hal="http://hal.archives-ouvertes.fr/" xmlns:gml="http://www.opengis.net/gml/3.3/" xmlns:gmlce="http://www.opengis.net/gml/3.3/ce" version="1.1" xsi:schemaLocation="http://www.tei-c.org/ns/1.0 http://api.archives-ouvertes.fr/documents/aofr-sword.xsd">
  <teiHeader>
    <fileDesc>
      <titleStmt>
        <title>HAL TEI export of hal-03721718</title>
      </titleStmt>
      <publicationStmt>
        <distributor>CCSD</distributor>
        <availability status="restricted">
          <licence target="https://creativecommons.org/publicdomain/zero/1.0/">CC0 1.0 - Universal</licence>
        </availability>
        <date when="2026-05-21T23:48:55+02:00"/>
      </publicationStmt>
      <sourceDesc>
        <p part="N">HAL API Platform</p>
      </sourceDesc>
    </fileDesc>
  </teiHeader>
  <text>
    <body>
      <listBibl>
        <biblFull>
          <titleStmt>
            <title xml:lang="en">Assessing Representation Learning and Clustering Algorithms for Computer-Assisted Image Annotation—Simulating and Benchmarking MorphoCluster</title>
            <author role="aut">
              <persName>
                <forename type="first">Simon-Martin</forename>
                <surname>Schröder</surname>
              </persName>
              <idno type="idhal" notation="numeric">793252</idno>
              <idno type="halauthorid" notation="string">1460801-793252</idno>
              <idno type="ORCID">https://orcid.org/0000-0002-6603-9907</idno>
              <affiliation ref="#struct-462123"/>
            </author>
            <author role="aut">
              <persName>
                <forename type="first">Rainer</forename>
                <surname>Kiko</surname>
              </persName>
              <email type="md5">f718f12965718abc39e7108e14625fe2</email>
              <email type="domain">obs-vlfr.fr</email>
              <idno type="idhal" notation="string">rainer-kiko</idno>
              <idno type="idhal" notation="numeric">1149536</idno>
              <idno type="halauthorid" notation="string">963441-1149536</idno>
              <idno type="ORCID">https://orcid.org/0000-0002-7851-9107</idno>
              <idno type="IDREF">https://www.idref.fr/276034236</idno>
              <idno type="GOOGLE SCHOLAR">https://scholar.google.fr/citations?user=5cGQZcYAAAAJ</idno>
              <affiliation ref="#struct-541740"/>
            </author>
            <editor role="depositor">
              <persName>
                <forename>Rainer</forename>
                <surname>Kiko</surname>
              </persName>
              <email type="md5">75b1f44c307197be66b6f6995f204323</email>
              <email type="domain">imev-mer.fr</email>
            </editor>
            <funder ref="#projanr-50529"/>
          </titleStmt>
          <editionStmt>
            <edition n="v1" type="current">
              <date type="whenSubmitted">2022-07-12 21:14:03</date>
              <date type="whenModified">2025-05-21 18:51:14</date>
              <date type="whenReleased">2022-07-19 10:32:13</date>
              <date type="whenProduced">2022-04-04</date>
              <date type="whenEndEmbargoed">2022-07-12</date>
              <ref type="file" target="https://hal.sorbonne-universite.fr/hal-03721718v1/document">
                <date notBefore="2022-07-12"/>
              </ref>
              <ref type="file" subtype="greenPublisher" n="1" target="https://hal.sorbonne-universite.fr/hal-03721718v1/file/Schr%C3%B6der%20und%20Kiko%20-%202022%20-%20Assessing%20Representation%20Learning%20and%20Clustering%20A.pdf" id="file-3721718-3250906">
                <date notBefore="2022-07-12"/>
              </ref>
            </edition>
            <respStmt>
              <resp>contributor</resp>
              <name key="1283761">
                <persName>
                  <forename>Rainer</forename>
                  <surname>Kiko</surname>
                </persName>
                <email type="md5">75b1f44c307197be66b6f6995f204323</email>
                <email type="domain">imev-mer.fr</email>
              </name>
            </respStmt>
          </editionStmt>
          <publicationStmt>
            <distributor>CCSD</distributor>
            <idno type="halId">hal-03721718</idno>
            <idno type="halUri">https://hal.sorbonne-universite.fr/hal-03721718</idno>
            <idno type="halBibtex">schroder:hal-03721718</idno>
            <idno type="halRefHtml">&lt;i&gt;Sensors&lt;/i&gt;, 2022, 22, &lt;a target="_blank" href="https://dx.doi.org/10.3390/s22072775"&gt;&amp;#x27E8;10.3390/s22072775&amp;#x27E9;&lt;/a&gt;</idno>
            <idno type="halRef">Sensors, 2022, 22, &amp;#x27E8;10.3390/s22072775&amp;#x27E9;</idno>
            <availability status="restricted">
              <licence target="https://about.hal.science/hal-authorisation-v1/">HAL Authorization<ref corresp="#file-3721718-3250906"/></licence>
            </availability>
          </publicationStmt>
          <seriesStmt>
            <idno type="stamp" n="SDE">Sciences De l'Environnement</idno>
            <idno type="stamp" n="INSU">INSU - Institut National des Sciences de l'Univers</idno>
            <idno type="stamp" n="CNRS">CNRS - Centre national de la recherche scientifique</idno>
            <idno type="stamp" n="GIP-BE">GIP Bretagne Environnement</idno>
            <idno type="stamp" n="LOV" corresp="SORBONNE-UNIVERSITE">Laboratoire d'Océanographie de Villefranche</idno>
            <idno type="stamp" n="SORBONNE-UNIVERSITE">Sorbonne Université</idno>
            <idno type="stamp" n="SORBONNE-UNIV" corresp="SORBONNE-UNIVERSITE">Sorbonne Université 01/01/2018</idno>
            <idno type="stamp" n="SU-SCIENCES" corresp="SORBONNE-UNIVERSITE">Faculté des Sciences de Sorbonne Université</idno>
            <idno type="stamp" n="UMS-829" corresp="SORBONNE-UNIVERSITE">Institut de la mer de Villefranche</idno>
            <idno type="stamp" n="SU-TI">Sorbonne Université - Texte Intégral</idno>
            <idno type="stamp" n="ANR">ANR</idno>
            <idno type="stamp" n="ALLIANCE-SU"> Alliance Sorbonne Université</idno>
            <idno type="stamp" n="SUPRA_BIOLOGIE">Biologie hors MNHN &amp; stations</idno>
            <idno type="stamp" n="ANR-OCEANS-19TO21" corresp="ANR-OCEANS">ANR-OCEANS-19TO21</idno>
            <idno type="stamp" n="ANR-OCEANS">ANR-OCEANS</idno>
          </seriesStmt>
          <notesStmt>
            <note type="audience" n="2">International</note>
            <note type="popular" n="0">No</note>
            <note type="peer" n="1">Yes</note>
          </notesStmt>
          <sourceDesc>
            <biblStruct>
              <analytic>
                <title xml:lang="en">Assessing Representation Learning and Clustering Algorithms for Computer-Assisted Image Annotation—Simulating and Benchmarking MorphoCluster</title>
                <author role="aut">
                  <persName>
                    <forename type="first">Simon-Martin</forename>
                    <surname>Schröder</surname>
                  </persName>
                  <idno type="idhal" notation="numeric">793252</idno>
                  <idno type="halauthorid" notation="string">1460801-793252</idno>
                  <idno type="ORCID">https://orcid.org/0000-0002-6603-9907</idno>
                  <affiliation ref="#struct-462123"/>
                </author>
                <author role="aut">
                  <persName>
                    <forename type="first">Rainer</forename>
                    <surname>Kiko</surname>
                  </persName>
                  <email type="md5">f718f12965718abc39e7108e14625fe2</email>
                  <email type="domain">obs-vlfr.fr</email>
                  <idno type="idhal" notation="string">rainer-kiko</idno>
                  <idno type="idhal" notation="numeric">1149536</idno>
                  <idno type="halauthorid" notation="string">963441-1149536</idno>
                  <idno type="ORCID">https://orcid.org/0000-0002-7851-9107</idno>
                  <idno type="IDREF">https://www.idref.fr/276034236</idno>
                  <idno type="GOOGLE SCHOLAR">https://scholar.google.fr/citations?user=5cGQZcYAAAAJ</idno>
                  <affiliation ref="#struct-541740"/>
                </author>
              </analytic>
              <monogr>
                <idno type="halJournalId" status="VALID">55556</idno>
                <idno type="issn">1424-8220</idno>
                <title level="j">Sensors</title>
                <imprint>
                  <publisher>MDPI</publisher>
                  <biblScope unit="volume">22</biblScope>
                  <date type="datePub">2022-04-04</date>
                </imprint>
              </monogr>
              <idno type="doi">10.3390/s22072775</idno>
            </biblStruct>
          </sourceDesc>
          <profileDesc>
            <langUsage>
              <language ident="en">English</language>
            </langUsage>
            <textClass>
              <classCode scheme="halDomain" n="sde">Environmental Sciences</classCode>
              <classCode scheme="halTypology" n="ART">Journal articles</classCode>
              <classCode scheme="halOldTypology" n="ART">Journal articles</classCode>
              <classCode scheme="halTreeTypology" n="ART">Journal articles</classCode>
            </textClass>
            <abstract xml:lang="en">
              <p>Image annotation is a time-consuming and costly task. Previously, we published MorphoClusteras a novel image annotation tool to address problems of conventional, classifier-basedimage annotation approaches: their limited efficiency, training set bias and lack of novelty detection.MorphoCluster uses clustering and similarity search to enable efficient, computer-assisted imageannotation. In this work, we provide a deeper analysis of this approach. We simulate the actions ofa MorphoCluster user to avoid extensive manual annotation runs. This simulation is used to testsupervised, unsupervised and transfer representation learning approaches. Furthermore, shrunkenk-means and partially labeled k-means, two new clustering algorithms that are tailored specificallyfor the MorphoCluster approach, are compared to the previously used HDBSCAN*. We find thatlabeled training data improve the image representations, that unsupervised learning beats transferlearning and that all three clustering algorithms are viable options, depending on whether completeness,efficiency or runtime is the priority. The simulation results support our earlier findingthat MorphoCluster is very efficient and precise. Within the simulation, more than five objects persimulated click are being annotated with 95% precision.</p>
            </abstract>
          </profileDesc>
        </biblFull>
      </listBibl>
    </body>
    <back>
      <listOrg type="structures">
        <org type="institution" xml:id="struct-462123" status="VALID">
          <idno type="IdRef">027909913</idno>
          <idno type="ISNI">0000000121539986</idno>
          <idno type="ROR">https://ror.org/04v76ef78</idno>
          <orgName>Christian-Albrechts-Universität zu Kiel = Christian-Albrechts University of Kiel = Université Christian-Albrechts de Kiel</orgName>
          <orgName type="acronym">CAU</orgName>
          <desc>
            <address>
              <addrLine>Christian-Albrechts-Platz 4, 24118 Kiel, Germany</addrLine>
              <country key="DE"/>
            </address>
            <ref type="url">http://www.uni-kiel.de/</ref>
          </desc>
        </org>
        <org type="laboratory" xml:id="struct-541740" status="VALID">
          <idno type="IdRef">153688688</idno>
          <idno type="ISNI">0000000403668890</idno>
          <idno type="RNSR">200112481S</idno>
          <idno type="ROR">https://ror.org/05r5y6641</idno>
          <orgName>Laboratoire d'océanographie de Villefranche</orgName>
          <orgName type="acronym">LOV</orgName>
          <date type="start">2018-01-01</date>
          <desc>
            <address>
              <addrLine>181, chemin du lazaret BP 28 06230 VILLEFRANCHE SUR MER Cedex</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">https://lov.imev-mer.fr/web/</ref>
          </desc>
          <listRelation>
            <relation active="#struct-300045" type="direct"/>
            <relation active="#struct-413221" type="direct"/>
            <relation name="UMR7093" active="#struct-441569" type="direct"/>
            <relation active="#struct-559566" type="direct"/>
            <relation name="FR3761" active="#struct-300045" type="direct"/>
            <relation name="FR3761" active="#struct-413221" type="direct"/>
            <relation name="FR3761" active="#struct-441569" type="direct"/>
          </listRelation>
        </org>
        <org type="institution" xml:id="struct-300045" status="VALID">
          <idno type="IdRef">029349265</idno>
          <idno type="ISNI">0000 0001 2154 1736</idno>
          <idno type="ROR">https://ror.org/04kdfz702</idno>
          <idno type="Wikidata">Q3152437</idno>
          <orgName>Institut national des sciences de l'Univers</orgName>
          <orgName type="acronym">INSU - CNRS</orgName>
          <date type="start">2007-04-19</date>
          <desc>
            <address>
              <addrLine>INSU-CNRS3 rue Michel-Ange, 75794 Paris Cedex 16</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">https://www.insu.cnrs.fr</ref>
          </desc>
        </org>
        <org type="regroupinstitution" xml:id="struct-413221" status="VALID">
          <idno type="IdRef">221333754</idno>
          <idno type="ROR">https://ror.org/02en5vm52</idno>
          <orgName>Sorbonne Université</orgName>
          <orgName type="acronym">SU</orgName>
          <date type="start">2018-01-01</date>
          <desc>
            <address>
              <addrLine>21 rue de l’École de médecine - 75006 Paris</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">http://www.sorbonne-universite.fr/</ref>
          </desc>
        </org>
        <org type="regroupinstitution" xml:id="struct-441569" status="VALID">
          <idno type="IdRef">02636817X</idno>
          <idno type="ISNI">0000000122597504</idno>
          <idno type="ROR">https://ror.org/02feahw73</idno>
          <orgName>Centre National de la Recherche Scientifique</orgName>
          <orgName type="acronym">CNRS</orgName>
          <date type="start">1939-10-19</date>
          <desc>
            <address>
              <country key="FR"/>
            </address>
            <ref type="url">https://www.cnrs.fr/</ref>
          </desc>
        </org>
        <org type="regrouplaboratory" xml:id="struct-559566" status="VALID">
          <idno type="RNSR">201622338R</idno>
          <idno type="ROR">05jpad840</idno>
          <orgName>Institut de la Mer de Villefranche</orgName>
          <orgName type="acronym">IMEV</orgName>
          <desc>
            <address>
              <addrLine>Institut de la Mer de Villefranche (IMEV)CNRS - Sorbonne Université181 chemin du Lazaret06230 Villefranche-sur-Mer - FRANCE</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">https://www.imev-mer.fr/web/</ref>
          </desc>
          <listRelation>
            <relation name="FR3761" active="#struct-300045" type="direct"/>
            <relation name="FR3761" active="#struct-413221" type="direct"/>
            <relation name="FR3761" active="#struct-441569" type="direct"/>
          </listRelation>
        </org>
      </listOrg>
      <listOrg type="projects">
        <org type="anrProject" xml:id="projanr-50529" status="VALID">
          <idno type="anr">ANR-19-MPGA-0012</idno>
          <orgName>TAD</orgName>
          <desc>Tropical Atlantic Deoxygenation: gateway dynamics, feedback mechanisms and ecosystem impacts</desc>
          <date type="start">2019</date>
        </org>
      </listOrg>
    </back>
  </text>
</TEI>