<?xml version="1.0" encoding="utf-8"?>
<TEI xmlns="http://www.tei-c.org/ns/1.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:hal="http://hal.archives-ouvertes.fr/" xmlns:gml="http://www.opengis.net/gml/3.3/" xmlns:gmlce="http://www.opengis.net/gml/3.3/ce" version="1.1" xsi:schemaLocation="http://www.tei-c.org/ns/1.0 http://api.archives-ouvertes.fr/documents/aofr-sword.xsd">
  <teiHeader>
    <fileDesc>
      <titleStmt>
        <title>HAL TEI export of hal-04908413</title>
      </titleStmt>
      <publicationStmt>
        <distributor>CCSD</distributor>
        <availability status="restricted">
          <licence target="https://creativecommons.org/publicdomain/zero/1.0/">CC0 1.0 - Universal</licence>
        </availability>
        <date when="2026-05-19T20:50:45+02:00"/>
      </publicationStmt>
      <sourceDesc>
        <p part="N">HAL API Platform</p>
      </sourceDesc>
    </fileDesc>
  </teiHeader>
  <text>
    <body>
      <listBibl>
        <biblFull>
          <titleStmt>
            <title xml:lang="en">Diverse patterns of correspondence between protist metabarcodes and protist metagenome-assembled genomes</title>
            <author role="aut">
              <persName>
                <forename type="first">Daryna</forename>
                <surname>Zavadska</surname>
              </persName>
              <idno type="halauthorid">3385962-0</idno>
            </author>
            <author role="aut">
              <persName>
                <forename type="first">Nicolas</forename>
                <surname>Henry</surname>
              </persName>
              <email type="md5">f0759072afd17b924cc7d5517e939859</email>
              <email type="domain">sb-roscoff.fr</email>
              <idno type="idhal" notation="string">nicolas-henry</idno>
              <idno type="idhal" notation="numeric">751540</idno>
              <idno type="halauthorid" notation="string">16013-751540</idno>
              <idno type="ORCID">https://orcid.org/0000-0002-7702-1382</idno>
              <idno type="IDREF">https://www.idref.fr/196940427</idno>
              <idno type="GOOGLE SCHOLAR">https://scholar.google.fr/citations?user=qcZ0di8AAAAJ</idno>
            </author>
            <author role="aut">
              <persName>
                <forename type="first">Adrià</forename>
                <surname>Auladell</surname>
              </persName>
              <idno type="halauthorid">2057565-0</idno>
            </author>
            <author role="aut">
              <persName>
                <forename type="first">Cédric</forename>
                <surname>Berney</surname>
              </persName>
              <idno type="idhal" notation="numeric">772942</idno>
              <idno type="halauthorid" notation="string">879693-772942</idno>
              <idno type="ORCID">https://orcid.org/0000-0001-8689-9907</idno>
              <affiliation ref="#struct-541812"/>
              <affiliation ref="#struct-572106"/>
            </author>
            <author role="aut">
              <persName>
                <forename type="first">Daniel</forename>
                <surname>Richter</surname>
              </persName>
              <idno type="halauthorid">6100-0</idno>
            </author>
            <editor role="depositor">
              <persName>
                <forename>Laure</forename>
                <surname>Guillou</surname>
              </persName>
              <email type="md5">5f5a3a51fca72bb21e56ccac20c9dac7</email>
              <email type="domain">sb-roscoff.fr</email>
            </editor>
          </titleStmt>
          <editionStmt>
            <edition n="v1" type="current">
              <date type="whenSubmitted">2025-01-23 14:19:19</date>
              <date type="whenModified">2026-03-11 10:04:08</date>
              <date type="whenReleased">2025-01-23 14:19:19</date>
              <date type="whenProduced">2024-06-06</date>
              <ref type="externalLink" target="https://www.ncbi.nlm.nih.gov/pmc/articles/11156365"/>
            </edition>
            <respStmt>
              <resp>contributor</resp>
              <name key="323854">
                <persName>
                  <forename>Laure</forename>
                  <surname>Guillou</surname>
                </persName>
                <email type="md5">5f5a3a51fca72bb21e56ccac20c9dac7</email>
                <email type="domain">sb-roscoff.fr</email>
              </name>
            </respStmt>
          </editionStmt>
          <publicationStmt>
            <distributor>CCSD</distributor>
            <idno type="halId">hal-04908413</idno>
            <idno type="halUri">https://hal.sorbonne-universite.fr/hal-04908413</idno>
            <idno type="halBibtex">zavadska:hal-04908413</idno>
            <idno type="halRefHtml">&lt;i&gt;PLoS ONE&lt;/i&gt;, 2024, 19 (6), pp.e0303697. &lt;a target="_blank" href="https://dx.doi.org/10.1371/journal.pone.0303697"&gt;&amp;#x27E8;10.1371/journal.pone.0303697&amp;#x27E9;&lt;/a&gt;</idno>
            <idno type="halRef">PLoS ONE, 2024, 19 (6), pp.e0303697. ⟨10.1371/journal.pone.0303697⟩</idno>
            <availability status="restricted"/>
          </publicationStmt>
          <seriesStmt>
            <idno type="stamp" n="SDE">Sciences De l'Environnement</idno>
            <idno type="stamp" n="CNRS">CNRS - Centre national de la recherche scientifique</idno>
            <idno type="stamp" n="GIP-BE">GIP Bretagne Environnement</idno>
            <idno type="stamp" n="ADMM" corresp="SBR">Adaptation et Diversité en Milieu Marin</idno>
            <idno type="stamp" n="SORBONNE-UNIVERSITE">Sorbonne Université</idno>
            <idno type="stamp" n="SORBONNE-UNIV" corresp="SORBONNE-UNIVERSITE">Sorbonne Université 01/01/2018</idno>
            <idno type="stamp" n="SU-SCIENCES" corresp="SORBONNE-UNIVERSITE">Faculté des Sciences de Sorbonne Université</idno>
            <idno type="stamp" n="SU-TI">Sorbonne Université - Texte Intégral</idno>
            <idno type="stamp" n="ALLIANCE-SU">Alliance Sorbonne Université</idno>
            <idno type="stamp" n="SBR" corresp="SORBONNE-UNIVERSITE">Station biologique de Roscoff</idno>
            <idno type="stamp" n="INEE-CNRS">Institut écologie et environnement du CNRS</idno>
            <idno type="stamp" n="SUPRA_BIOLOGIE">Biologie hors MNHN &amp; stations</idno>
            <idno type="stamp" n="ECOMAP" corresp="ADMM">ECOlogy of MArine Plankton team</idno>
          </seriesStmt>
          <notesStmt>
            <note type="audience" n="2">International</note>
            <note type="popular" n="0">No</note>
            <note type="peer" n="1">Yes</note>
          </notesStmt>
          <sourceDesc>
            <biblStruct>
              <analytic>
                <title xml:lang="en">Diverse patterns of correspondence between protist metabarcodes and protist metagenome-assembled genomes</title>
                <author role="aut">
                  <persName>
                    <forename type="first">Daryna</forename>
                    <surname>Zavadska</surname>
                  </persName>
                  <idno type="halauthorid">3385962-0</idno>
                </author>
                <author role="aut">
                  <persName>
                    <forename type="first">Nicolas</forename>
                    <surname>Henry</surname>
                  </persName>
                  <email type="md5">f0759072afd17b924cc7d5517e939859</email>
                  <email type="domain">sb-roscoff.fr</email>
                  <idno type="idhal" notation="string">nicolas-henry</idno>
                  <idno type="idhal" notation="numeric">751540</idno>
                  <idno type="halauthorid" notation="string">16013-751540</idno>
                  <idno type="ORCID">https://orcid.org/0000-0002-7702-1382</idno>
                  <idno type="IDREF">https://www.idref.fr/196940427</idno>
                  <idno type="GOOGLE SCHOLAR">https://scholar.google.fr/citations?user=qcZ0di8AAAAJ</idno>
                </author>
                <author role="aut">
                  <persName>
                    <forename type="first">Adrià</forename>
                    <surname>Auladell</surname>
                  </persName>
                  <idno type="halauthorid">2057565-0</idno>
                </author>
                <author role="aut">
                  <persName>
                    <forename type="first">Cédric</forename>
                    <surname>Berney</surname>
                  </persName>
                  <idno type="idhal" notation="numeric">772942</idno>
                  <idno type="halauthorid" notation="string">879693-772942</idno>
                  <idno type="ORCID">https://orcid.org/0000-0001-8689-9907</idno>
                  <affiliation ref="#struct-541812"/>
                  <affiliation ref="#struct-572106"/>
                </author>
                <author role="aut">
                  <persName>
                    <forename type="first">Daniel</forename>
                    <surname>Richter</surname>
                  </persName>
                  <idno type="halauthorid">6100-0</idno>
                </author>
              </analytic>
              <monogr>
                <idno type="halJournalId" status="VALID">28700</idno>
                <idno type="issn">1932-6203</idno>
                <idno type="eissn">1932-6203</idno>
                <title level="j">PLoS ONE</title>
                <imprint>
                  <publisher>Public Library of Science</publisher>
                  <biblScope unit="volume">19</biblScope>
                  <biblScope unit="issue">6</biblScope>
                  <biblScope unit="pp">e0303697</biblScope>
                  <date type="datePub">2024-06-06</date>
                </imprint>
              </monogr>
              <idno type="doi">10.1371/journal.pone.0303697</idno>
            </biblStruct>
          </sourceDesc>
          <profileDesc>
            <langUsage>
              <language ident="en">English</language>
            </langUsage>
            <textClass>
              <classCode scheme="halDomain" n="sde">Environmental Sciences</classCode>
              <classCode scheme="halTypology" n="ART">Journal articles</classCode>
              <classCode scheme="halOldTypology" n="ART">Journal articles</classCode>
              <classCode scheme="halTreeTypology" n="ART">Journal articles</classCode>
            </textClass>
            <abstract xml:lang="en">
              <p>Two common approaches to study the composition of environmental protist communities are metabarcoding and metagenomics. Raw metabarcoding data are usually processed into Operational Taxonomic Units (OTUs) or amplicon sequence variants (ASVs) through clustering or denoising approaches, respectively. Analogous approaches are used to assemble metagenomic reads into metagenome-assembled genomes (MAGs). Understanding the correspondence between the data produced by these two approaches can help to integrate information between the datasets and to explain how metabarcoding OTUs and MAGs are related with the underlying biological entities they are hypothesised to represent. MAGs do not contain the commonly used barcoding loci, therefore sequence homology approaches cannot be used to match OTUs and MAGs. We made an attempt to match V9 metabarcoding OTUs from the 18S rRNA gene (V9 OTUs) and MAGs from the Tara Oceans expedition based on the correspondence of their relative abundances across the same set of samples. We evaluated several metrics for detecting correspondence between features in these two datasets and developed controls to filter artefacts of data structure and processing. After selecting the best-performing metrics, ranking the V9 OTU/MAG matches by their proportionality/correlation coefficients and applying a set of selection criteria, we identified candidate matches between V9 OTUs and MAGs. In some cases, V9 OTUs and MAGs could be matched with a one-to-one correspondence, implying that they likely represent the same underlying biological entity. More generally, matches we observed could be classified into 4 scenarios: one V9 OTU matches many MAGs; many V9 OTUs match many MAGs; many V9 OTUs match one MAG; one V9 OTU matches one MAG. 
Notably, we found some instances in which different OTU-MAG matches from the same taxonomic group were not classified in the same scenario, with all four scenarios possible even within the same taxonomic group, illustrating that factors beyond taxonomic lineage influence the relationship between OTUs and MAGs. Overall, each scenario produces a different interpretation of V9 OTUs, MAGs and how they compare in terms of the genomic and ecological diversity they represent.</p>
            </abstract>
          </profileDesc>
        </biblFull>
      </listBibl>
    </body>
    <back>
      <listOrg type="structures">
        <org type="laboratory" xml:id="struct-541812" status="VALID">
          <idno type="IdRef">242206565</idno>
          <idno type="ISNI">0000000403687354</idno>
          <idno type="RNSR">200512529B</idno>
          <idno type="ROR">https://ror.org/0293jn610</idno>
          <orgName>Adaptation et diversité en milieu marin</orgName>
          <orgName type="acronym">AD2M</orgName>
          <date type="start">2017-01-01</date>
          <desc>
            <address>
              <addrLine>Place Georges Teissier - BP 74 29682 ROSCOFF CEDEX</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">https://www.sb-roscoff.fr/fr/unite-adaptation-et-diversite-en-milieu-marin</ref>
          </desc>
          <listRelation>
            <relation active="#struct-413221" type="direct"/>
            <relation name="UMR7144" active="#struct-441569" type="direct"/>
            <relation name="UMR 7144" active="#struct-541806" type="direct"/>
            <relation name="FR2424" active="#struct-441569" type="direct"/>
          </listRelation>
        </org>
        <org type="researchteam" xml:id="struct-572106" status="VALID">
          <orgName>ECOlogy of MArine Plankton</orgName>
          <orgName type="acronym">ECOMAP</orgName>
          <date type="start">2019-01-01</date>
          <desc>
            <address>
              <addrLine>Place Georges Teissier 29680 Roscoff</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">http://www.sb-roscoff.fr/fr/ecomap</ref>
          </desc>
          <listRelation>
            <relation active="#struct-541812" type="direct"/>
            <relation active="#struct-413221" type="indirect"/>
            <relation name="UMR7144" active="#struct-441569" type="indirect"/>
            <relation name="UMR 7144" active="#struct-541806" type="indirect"/>
            <relation name="FR2424" active="#struct-441569" type="indirect"/>
          </listRelation>
        </org>
        <org type="regroupinstitution" xml:id="struct-413221" status="VALID">
          <idno type="IdRef">221333754</idno>
          <idno type="ROR">https://ror.org/02en5vm52</idno>
          <orgName>Sorbonne Université</orgName>
          <orgName type="acronym">SU</orgName>
          <date type="start">2018-01-01</date>
          <desc>
            <address>
              <addrLine>21 rue de l’École de médecine - 75006 Paris</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">http://www.sorbonne-universite.fr/</ref>
          </desc>
        </org>
        <org type="regroupinstitution" xml:id="struct-441569" status="VALID">
          <idno type="IdRef">02636817X</idno>
          <idno type="ISNI">0000000122597504</idno>
          <idno type="ROR">https://ror.org/02feahw73</idno>
          <orgName>Centre National de la Recherche Scientifique</orgName>
          <orgName type="acronym">CNRS</orgName>
          <date type="start">1939-10-19</date>
          <desc>
            <address>
              <country key="FR"/>
            </address>
            <ref type="url">https://www.cnrs.fr/</ref>
          </desc>
        </org>
        <org type="regrouplaboratory" xml:id="struct-541806" status="VALID">
          <idno type="RNSR">200119846X</idno>
          <idno type="ROR">https://ror.org/03s0pzj56</idno>
          <orgName>Station biologique de Roscoff = Roscoff Marine Station</orgName>
          <orgName type="acronym">SBR</orgName>
          <desc>
            <address>
              <addrLine>Place Georges Teissier - BP 74 29682 ROSCOFF CEDEX</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">http://www.sb-roscoff.fr</ref>
          </desc>
          <listRelation>
            <relation active="#struct-413221" type="direct"/>
            <relation name="FR2424" active="#struct-441569" type="direct"/>
          </listRelation>
        </org>
      </listOrg>
    </back>
  </text>
</TEI>