<?xml version="1.0" encoding="utf-8"?>
<TEI xmlns="http://www.tei-c.org/ns/1.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:hal="http://hal.archives-ouvertes.fr/" xmlns:gml="http://www.opengis.net/gml/3.3/" xmlns:gmlce="http://www.opengis.net/gml/3.3/ce" version="1.1" xsi:schemaLocation="http://www.tei-c.org/ns/1.0 http://api.archives-ouvertes.fr/documents/aofr-sword.xsd">
  <teiHeader>
    <fileDesc>
      <titleStmt>
        <title>HAL TEI export of hal-01306635</title>
      </titleStmt>
      <publicationStmt>
        <distributor>CCSD</distributor>
        <availability status="restricted">
          <licence target="https://creativecommons.org/publicdomain/zero/1.0/">CC0 1.0 - Universal</licence>
        </availability>
        <date when="2026-05-23T22:50:10+02:00"/>
      </publicationStmt>
      <sourceDesc>
        <p part="N">HAL API Platform</p>
      </sourceDesc>
    </fileDesc>
  </teiHeader>
  <text>
    <body>
      <listBibl>
        <biblFull>
          <titleStmt>
            <title xml:lang="en">On the efficiency of the Accelerated Processing Unit for scientific computing</title>
            <author role="aut">
              <persName>
                <forename type="first">Issam</forename>
                <surname>Said</surname>
              </persName>
              <email type="md5">2cae5d3ec5e7134fc68bf934d6033250</email>
              <email type="domain">lip6.fr</email>
              <idno type="idhal" notation="string">issam-said</idno>
              <idno type="idhal" notation="numeric">5652</idno>
              <idno type="halauthorid" notation="string">27213-5652</idno>
              <idno type="IDREF">https://www.idref.fr/193144557</idno>
              <affiliation ref="#struct-389984"/>
            </author>
            <author role="aut">
              <persName>
                <forename type="first">Pierre</forename>
                <surname>Fortin</surname>
              </persName>
              <email type="md5">e19e7b55edfec3940e3b1fc931ad011d</email>
              <email type="domain">univ-lille.fr</email>
              <idno type="idhal" notation="string">pierre-fortin</idno>
              <idno type="idhal" notation="numeric">2113</idno>
              <idno type="halauthorid" notation="string">13598-2113</idno>
              <idno type="IDREF">https://www.idref.fr/11411255X</idno>
              <idno type="ORCID">https://orcid.org/0000-0003-3117-9122</idno>
              <affiliation ref="#struct-389984"/>
            </author>
            <author role="aut">
              <persName>
                <forename type="first">Jean-Luc</forename>
                <surname>Lamotte</surname>
              </persName>
              <email type="md5">585849e6e80836c954a03ffaf6a8c2b2</email>
              <email type="domain">lip6.fr</email>
              <idno type="idhal" notation="numeric">966000</idno>
              <idno type="halauthorid" notation="string">682155-966000</idno>
              <affiliation ref="#struct-389984"/>
            </author>
            <author role="aut">
              <persName>
                <forename type="first">Romain</forename>
                <surname>Dolbeau</surname>
              </persName>
              <idno type="halauthorid">143907-0</idno>
              <affiliation ref="#struct-60443"/>
            </author>
            <author role="aut">
              <persName>
                <forename type="first">Henri</forename>
                <surname>Calandra</surname>
              </persName>
              <email type="md5">adc471e7369aaf46940638f304169f7b</email>
              <email type="domain">total.com</email>
              <idno type="idhal" notation="numeric">856259</idno>
              <idno type="halauthorid" notation="string">367318-856259</idno>
              <affiliation ref="#struct-154617"/>
            </author>
            <editor role="depositor">
              <persName>
                <forename>Pierre</forename>
                <surname>Fortin</surname>
              </persName>
              <email type="md5">e19e7b55edfec3940e3b1fc931ad011d</email>
              <email type="domain">univ-lille.fr</email>
            </editor>
          </titleStmt>
          <editionStmt>
            <edition n="v1" type="current">
              <date type="whenSubmitted">2016-04-25 11:00:27</date>
              <date type="whenModified">2023-04-11 15:16:28</date>
              <date type="whenReleased">2016-04-25 11:00:27</date>
              <date type="whenProduced">2016-04-03</date>
            </edition>
            <respStmt>
              <resp>contributor</resp>
              <name key="179241">
                <persName>
                  <forename>Pierre</forename>
                  <surname>Fortin</surname>
                </persName>
                <email type="md5">e19e7b55edfec3940e3b1fc931ad011d</email>
                <email type="domain">univ-lille.fr</email>
              </name>
            </respStmt>
          </editionStmt>
          <publicationStmt>
            <distributor>CCSD</distributor>
            <idno type="halId">hal-01306635</idno>
            <idno type="halUri">https://hal.sorbonne-universite.fr/hal-01306635</idno>
            <idno type="halBibtex">said:hal-01306635</idno>
            <idno type="halRefHtml">&lt;i&gt;24th High Performance Computing Symposium (HPC 2016)&lt;/i&gt;, Apr 2016, Pasadena, United States. pp.349-356, &lt;a target="_blank" href="https://dx.doi.org/10.22360/SpringSim.2016.HPC.040"&gt;&amp;#x27E8;10.22360/SpringSim.2016.HPC.040&amp;#x27E9;&lt;/a&gt;</idno>
            <idno type="halRef">24th High Performance Computing Symposium (HPC 2016), Apr 2016, Pasadena, United States. pp.349-356, &amp;#x27E8;10.22360/SpringSim.2016.HPC.040&amp;#x27E9;</idno>
            <availability status="restricted"/>
          </publicationStmt>
          <seriesStmt>
            <idno type="stamp" n="UPMC" corresp="SORBONNE-UNIVERSITE">Université Pierre et Marie Curie</idno>
            <idno type="stamp" n="CNRS">CNRS - Centre national de la recherche scientifique</idno>
            <idno type="stamp" n="LIP6" corresp="SORBONNE-UNIVERSITE">Laboratoire d'Informatique de Paris 6</idno>
            <idno type="stamp" n="UPMC_POLE_1" corresp="UPMC">UPMC Pôle 1</idno>
            <idno type="stamp" n="SORBONNE-UNIVERSITE">Sorbonne Université</idno>
            <idno type="stamp" n="SU-SCIENCES" corresp="SORBONNE-UNIVERSITE">Faculté des Sciences de Sorbonne Université</idno>
            <idno type="stamp" n="ALLIANCE-SU"> Alliance Sorbonne Université</idno>
          </seriesStmt>
          <notesStmt>
            <note type="audience" n="2">International</note>
            <note type="invited" n="0">No</note>
            <note type="popular" n="0">No</note>
            <note type="peer" n="1">Yes</note>
            <note type="proceedings" n="1">Yes</note>
          </notesStmt>
          <sourceDesc>
            <biblStruct>
              <analytic>
                <title xml:lang="en">On the efficiency of the Accelerated Processing Unit for scientific computing</title>
                <author role="aut">
                  <persName>
                    <forename type="first">Issam</forename>
                    <surname>Said</surname>
                  </persName>
                  <email type="md5">2cae5d3ec5e7134fc68bf934d6033250</email>
                  <email type="domain">lip6.fr</email>
                  <idno type="idhal" notation="string">issam-said</idno>
                  <idno type="idhal" notation="numeric">5652</idno>
                  <idno type="halauthorid" notation="string">27213-5652</idno>
                  <idno type="IDREF">https://www.idref.fr/193144557</idno>
                  <affiliation ref="#struct-389984"/>
                </author>
                <author role="aut">
                  <persName>
                    <forename type="first">Pierre</forename>
                    <surname>Fortin</surname>
                  </persName>
                  <email type="md5">e19e7b55edfec3940e3b1fc931ad011d</email>
                  <email type="domain">univ-lille.fr</email>
                  <idno type="idhal" notation="string">pierre-fortin</idno>
                  <idno type="idhal" notation="numeric">2113</idno>
                  <idno type="halauthorid" notation="string">13598-2113</idno>
                  <idno type="IDREF">https://www.idref.fr/11411255X</idno>
                  <idno type="ORCID">https://orcid.org/0000-0003-3117-9122</idno>
                  <affiliation ref="#struct-389984"/>
                </author>
                <author role="aut">
                  <persName>
                    <forename type="first">Jean-Luc</forename>
                    <surname>Lamotte</surname>
                  </persName>
                  <email type="md5">585849e6e80836c954a03ffaf6a8c2b2</email>
                  <email type="domain">lip6.fr</email>
                  <idno type="idhal" notation="numeric">966000</idno>
                  <idno type="halauthorid" notation="string">682155-966000</idno>
                  <affiliation ref="#struct-389984"/>
                </author>
                <author role="aut">
                  <persName>
                    <forename type="first">Romain</forename>
                    <surname>Dolbeau</surname>
                  </persName>
                  <idno type="halauthorid">143907-0</idno>
                  <affiliation ref="#struct-60443"/>
                </author>
                <author role="aut">
                  <persName>
                    <forename type="first">Henri</forename>
                    <surname>Calandra</surname>
                  </persName>
                  <email type="md5">adc471e7369aaf46940638f304169f7b</email>
                  <email type="domain">total.com</email>
                  <idno type="idhal" notation="numeric">856259</idno>
                  <idno type="halauthorid" notation="string">367318-856259</idno>
                  <affiliation ref="#struct-154617"/>
                </author>
              </analytic>
              <monogr>
                <title level="m">Proceedings of the 2016 Spring Simulation Multi-Conference (SPRINGSIM).</title>
                <meeting>
                  <title>24th High Performance Computing Symposium (HPC 2016)</title>
                  <date type="start">2016-04-03</date>
                  <date type="end">2016-04-06</date>
                  <settlement>Pasadena</settlement>
                  <country key="US">United States</country>
                </meeting>
                <imprint>
                  <publisher>Society for Computer Simulation International</publisher>
                  <biblScope unit="pp">349-356</biblScope>
                </imprint>
              </monogr>
              <idno type="doi">10.22360/SpringSim.2016.HPC.040</idno>
            </biblStruct>
          </sourceDesc>
          <profileDesc>
            <langUsage>
              <language ident="en">English</language>
            </langUsage>
            <textClass>
              <classCode scheme="halDomain" n="scco.comp">Cognitive science/Computer science</classCode>
              <classCode scheme="halTypology" n="COMM">Conference papers</classCode>
              <classCode scheme="halOldTypology" n="COMM">Conference papers</classCode>
              <classCode scheme="halTreeTypology" n="COMM">Conference papers</classCode>
            </textClass>
            <abstract xml:lang="en">
              <p>The AMD APU (Accelerated Processing Unit) architecture, which combines CPU and GPU cores on the same die at a low power budget, promises a significant advent in GPU computing, in particular to applications which performance is bottlenecked by the low PCI communication rate. However APUs are slowly heading towards a perfectly unified CPU-GPU memory space. Besides, APU integrated GPUs are also less powerful than discrete GPUs. In this paper we therefore investigate the interest of APUs for scientific computing by evaluating and comparing the performance and the power efficiency of an AMD APU (code-named Kaveri) against a discrete GPU (code-named Tahiti) and an hexa-core AMD CPU (Phenom CPU). For this purpose, we rely on two common applicative benchmarks in single precision, namely a matrix-matrix multiplication and a 3D finite difference stencil, that are optimized and tuned in OpenCL. Our results confirm that APU integrated GPUs outperform CPUs and may outperform discrete GPUs for medium-sized problems as well as for applications with high communication requirements. Moreover, our study shows that APUs can be up to 20% more power efficient than discrete GPUs.</p>
            </abstract>
          </profileDesc>
        </biblFull>
      </listBibl>
    </body>
    <back>
      <listOrg type="structures">
        <org type="researchteam" xml:id="struct-389984" status="OLD">
          <orgName>Performance et Qualité des Algorithmes Numériques</orgName>
          <orgName type="acronym">PEQUAN</orgName>
          <date type="start">2004-01-01</date>
          <date type="end">2017-12-31</date>
          <desc>
            <address>
              <country key="FR"/>
            </address>
          </desc>
          <listRelation>
            <relation active="#struct-233" type="direct"/>
            <relation active="#struct-93591" type="indirect"/>
            <relation name="UMR7606" active="#struct-441569" type="indirect"/>
          </listRelation>
        </org>
        <org type="laboratory" xml:id="struct-60443" status="VALID">
          <orgName>CAPS Enterprise</orgName>
          <orgName type="acronym">CAPS</orgName>
          <desc>
            <address>
              <addrLine>CAPS entreprise Immeuble CAP Nord – Bât A 4 Allée Marie Berhaut 35000 Rennes – France</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">http://www.caps-entreprise.com/</ref>
          </desc>
          <listRelation>
            <relation active="#struct-314212" type="direct"/>
          </listRelation>
        </org>
        <org type="laboratory" xml:id="struct-154617" status="VALID">
          <orgName>Total E&amp;P</orgName>
          <desc>
            <address>
              <country key="FR"/>
            </address>
          </desc>
          <listRelation>
            <relation active="#struct-328942" type="direct"/>
          </listRelation>
        </org>
        <org type="laboratory" xml:id="struct-233" status="OLD">
          <idno type="RNSR">199712651U</idno>
          <idno type="ROR">https://ror.org/05krcen59</idno>
          <orgName>Laboratoire d'Informatique de Paris 6</orgName>
          <orgName type="acronym">LIP6</orgName>
          <date type="start">1997-01-01</date>
          <date type="end">2017-12-31</date>
          <desc>
            <address>
              <addrLine>4 Place JUSSIEU 75252 PARIS CEDEX 05</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">http://www.lip6.fr/</ref>
          </desc>
          <listRelation>
            <relation active="#struct-93591" type="direct"/>
            <relation name="UMR7606" active="#struct-441569" type="direct"/>
          </listRelation>
        </org>
        <org type="institution" xml:id="struct-93591" status="OLD">
          <idno type="ROR">https://ror.org/02en5vm52</idno>
          <orgName>Université Pierre et Marie Curie - Paris 6</orgName>
          <orgName type="acronym">UPMC</orgName>
          <date type="end">2017-12-31</date>
          <desc>
            <address>
              <addrLine>4 place Jussieu - 75005 Paris</addrLine>
              <country key="FR"/>
            </address>
            <ref type="url">http://www.upmc.fr/</ref>
          </desc>
        </org>
        <org type="regroupinstitution" xml:id="struct-441569" status="VALID">
          <idno type="IdRef">02636817X</idno>
          <idno type="ISNI">0000000122597504</idno>
          <idno type="ROR">https://ror.org/02feahw73</idno>
          <orgName>Centre National de la Recherche Scientifique</orgName>
          <orgName type="acronym">CNRS</orgName>
          <date type="start">1939-10-19</date>
          <desc>
            <address>
              <country key="FR"/>
            </address>
            <ref type="url">https://www.cnrs.fr/</ref>
          </desc>
        </org>
        <org type="institution" xml:id="struct-314212" status="INCOMING">
          <orgName>CAPS Enterprise</orgName>
          <desc>
            <address>
              <country key="FR"/>
            </address>
          </desc>
        </org>
        <org type="institution" xml:id="struct-328942" status="INCOMING">
          <orgName>Total E&amp;P</orgName>
          <desc>
            <address>
              <country key="FR"/>
            </address>
          </desc>
        </org>
      </listOrg>
    </back>
  </text>
</TEI>