<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//TaxonX//DTD Taxonomic Treatment Publishing DTD v0 20100105//EN" "../../nlm/tax-treatment-NS0.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:tp="http://www.plazi.org/taxpub" article-type="research-article">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">17</journal-id>
      <journal-id journal-id-type="index">urn:lsid:arphahub.com:pub:8E638694-B4E0-570A-856A-746FF325BF6B</journal-id>
      <journal-title-group>
        <journal-title xml:lang="en">Research Ideas and Outcomes</journal-title>
        <abbrev-journal-title xml:lang="en">RIO</abbrev-journal-title>
      </journal-title-group>
      <issn pub-type="epub">2367-7163</issn>
      <publisher>
        <publisher-name>Pensoft Publishers</publisher-name>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="doi">10.3897/rio.8.e94758</article-id>
      <article-id pub-id-type="publisher-id">94758</article-id>
      <article-id pub-id-type="manuscript">20471</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Conference Abstract</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Realizing FAIR Digital Objects for the German Helmholtz Association of Research Centres</article-title>
      </title-group>
      <contrib-group content-type="authors">
        <contrib contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Jejkal</surname>
            <given-names>Thomas</given-names>
          </name>
          <email xlink:type="simple">thomas.jejkal@kit.edu</email>
          <uri content-type="orcid">https://orcid.org/0000-0003-2804-688X</uri>
          <xref ref-type="aff" rid="A1">1</xref>
        </contrib>
        <contrib contrib-type="author" corresp="no">
          <name name-style="western">
            <surname>Pfeil</surname>
            <given-names>Andreas</given-names>
          </name>
          <uri content-type="orcid">https://orcid.org/0000-0001-6575-1022</uri>
          <xref ref-type="aff" rid="A1">1</xref>
        </contrib>
        <contrib contrib-type="author" corresp="no">
          <name name-style="western">
            <surname>Schweikert</surname>
            <given-names>Jan</given-names>
          </name>
          <uri content-type="orcid">https://orcid.org/0000-0003-4774-2717</uri>
          <xref ref-type="aff" rid="A1">1</xref>
        </contrib>
        <contrib contrib-type="author" corresp="no">
          <name name-style="western">
            <surname>Pirogov</surname>
            <given-names>Anton</given-names>
          </name>
          <uri content-type="orcid">https://orcid.org/0000-0002-5077-7497</uri>
          <xref ref-type="aff" rid="A2">2</xref>
        </contrib>
        <contrib contrib-type="author" corresp="no">
          <name name-style="western">
            <surname>Barranco</surname>
            <given-names>Pedro Videgain</given-names>
          </name>
          <xref ref-type="aff" rid="A2">2</xref>
        </contrib>
        <contrib contrib-type="author" corresp="no">
          <name name-style="western">
            <surname>Krebs</surname>
            <given-names>Florian</given-names>
          </name>
          <uri content-type="orcid">https://orcid.org/0000-0001-6033-801X</uri>
          <xref ref-type="aff" rid="A3">3</xref>
        </contrib>
        <contrib contrib-type="author" corresp="no">
          <name name-style="western">
            <surname>Koch</surname>
            <given-names>Christian</given-names>
          </name>
          <xref ref-type="aff" rid="A4">4</xref>
        </contrib>
        <contrib contrib-type="author" corresp="no">
          <name name-style="western">
            <surname>Guenther</surname>
            <given-names>Gerrit</given-names>
          </name>
          <uri content-type="orcid">https://orcid.org/0000-0001-6243-1728</uri>
          <xref ref-type="aff" rid="A5">5</xref>
        </contrib>
        <contrib contrib-type="author" corresp="no">
          <name name-style="western">
            <surname>Curdt</surname>
            <given-names>Constanze</given-names>
          </name>
          <xref ref-type="aff" rid="A6">6</xref>
        </contrib>
        <contrib contrib-type="author" corresp="no">
          <name name-style="western">
            <surname>Weinelt</surname>
            <given-names>Martin</given-names>
          </name>
          <xref ref-type="aff" rid="A6">6</xref>
        </contrib>
      </contrib-group>
      <aff id="A1">
        <label>1</label>
        <addr-line content-type="verbatim">Karlsruhe Institute of Technology, Eggenstein-Leopoldshafen, Germany</addr-line>
        <institution>Karlsruhe Institute of Technology</institution>
        <addr-line content-type="city">Eggenstein-Leopoldshafen</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="A2">
        <label>2</label>
        <addr-line content-type="verbatim">Forschungszentrum Juelich, Juelich, Germany</addr-line>
        <institution>Forschungszentrum Juelich</institution>
        <addr-line content-type="city">Juelich</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="A3">
        <label>3</label>
        <addr-line content-type="verbatim">German Aerospace Center, Bonn, Germany</addr-line>
        <institution>German Aerospace Center</institution>
        <addr-line content-type="city">Bonn</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="A4">
        <label>4</label>
        <addr-line content-type="verbatim">German Cancer Research Center, Heidelberg, Germany</addr-line>
        <institution>German Cancer Research Center</institution>
        <addr-line content-type="city">Heidelberg</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="A5">
        <label>5</label>
        <addr-line content-type="verbatim">Helmholtz-Zentrum Berlin, Berlin, Germany</addr-line>
        <institution>Helmholtz-Zentrum Berlin</institution>
        <addr-line content-type="city">Berlin</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="A6">
        <label>6</label>
        <addr-line content-type="verbatim">Geomar, Kiel, Germany</addr-line>
        <institution>Geomar</institution>
        <addr-line content-type="city">Kiel</addr-line>
        <country>Germany</country>
      </aff>
      <author-notes>
        <fn fn-type="corresp">
          <p>Corresponding author: Thomas Jejkal (<email xlink:type="simple">thomas.jejkal@kit.edu</email>).</p>
        </fn>
        <fn fn-type="edited-by">
          <p>Academic editor: </p>
        </fn>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2022</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>12</day>
        <month>10</month>
        <year>2022</year>
      </pub-date>
      <volume>8</volume>
      <elocation-id>e94758</elocation-id>
      <uri content-type="arpha" xlink:href="http://openbiodiv.net/A35EEE99-16B0-502C-88A9-836167CDFCD2">A35EEE99-16B0-502C-88A9-836167CDFCD2</uri>
      <uri content-type="zenodo_dep_id" xlink:href="https://zenodo.org/record/0">0</uri>
      <permissions>
        <copyright-statement>Thomas Jejkal, Andreas Pfeil, Jan Schweikert, Anton Pirogov, Pedro Videgain Barranco, Florian Krebs, Christian Koch, Gerrit Guenther, Constanze Curdt, Martin Weinelt</copyright-statement>
        <license license-type="creative-commons-attribution" xlink:href="http://creativecommons.org/licenses/by/4.0/" xlink:type="simple">
          <license-p>This is an open access article distributed under the terms of the Creative Commons Attribution License (CC BY 4.0), which permits unrestricted use, distribution, and reproduction in any medium, provided the original author and source are credited.</license-p>
        </license>
      </permissions>
      <abstract>
        <label>Abstract</label>
        <p>The Helmholtz Association (<xref ref-type="bibr" rid="B8006492">Anonymous 2022d</xref>), the largest association of large-scale research centres in Germany, covers a wide range of research fields, employing more than 43,000 researchers. In 2019, the Helmholtz Metadata Collaboration (HMC) Platform (<xref ref-type="bibr" rid="B8006538">Anonymous 2022f</xref>) was started as a joint endeavor across all research areas of the Helmholtz Association to make the depth and breadth of research data produced by Helmholtz Centres findable, accessible, interoperable, and reusable (FAIR) for the whole science community. To reach this goal, the concept of FAIR Digital Objects (FAIR DOs) has been chosen as a top-level commonality for existing and future infrastructures of all research fields.</p>
        <p>In doing so, HMC follows the original approach of realizing FAIR DOs based on globally unique Persistent Identifiers (PID), e.g., provided by <ext-link ext-link-type="uri" xlink:href="https://handle.net/">https://handle.net/</ext-link>, machine-actionable PID Records and strong typing using Data Types like <ext-link ext-link-type="uri" xlink:href="https://dtr-test.pidconsortium.eu/#objects/21.T11148/1c699a5d1b4ad3ba4956">https://dtr-test.pidconsortium.eu/#objects/21.T11148/1c699a5d1b4ad3ba4956</ext-link> registered in a Data Type Registry, e.g., <ext-link ext-link-type="uri" xlink:href="http://dtr-test.pidconsortium.eu/">http://dtr-test.pidconsortium.eu/</ext-link>. In all these areas, HMC can build on the great groundwork of the Research Data Alliance and the FAIR DO Forum. However, when it comes to realization, there are still some gaps that will have to be addressed during our work and will be raised in this presentation.</p>
        <p>For single FAIR DO components like PIDs and Data Types, existing infrastructures are already available. Here, the Gesellschaft für wissenschaftliche Datenverarbeitung mbH Göttingen (GWDG) (<xref ref-type="bibr" rid="B8006500">Anonymous 2022e</xref>) provides strong support with their many years of experience in this field. Within the framework of the ePIC consortium (<xref ref-type="bibr" rid="B8006484">Anonymous 2022c</xref>), the GWDG on the one hand offers PID prefixes based on a sustainable business model and on the other hand is very active in providing base services required for realizing FAIR DOs, e.g., different instances of Data Type Registries for accessing, creating, and managing Data Types required by FAIR DOs. Besides that, in the context of HMC we developed a couple of technical components to support the creation and management of FAIR DOs: the Typed PID Maker (<xref ref-type="bibr" rid="B8006508">Pfeil 2022b</xref>), providing machine-actionable interfaces for creating, validating, and managing PIDs with machine-actionable metadata stored in their PID record, and the FAIR DO testbed, currently evolving into the FAIR DO Lab (<xref ref-type="bibr" rid="B8006516">Pfeil 2022a</xref>), serving as a reference implementation for setting up a FAIR DO ecosystem. However, introducing FAIR DOs is not only about providing technical services, but also requires the definition of and agreement on interfaces, policies, and processes.</p>
        <p>A first step in this direction was made in the context of HMC by agreeing on a Helmholtz Kernel Information Profile (<ext-link ext-link-type="uri" xlink:href="http://dtr-test.pidconsortium.eu/#objects/21.T11148/b9b76f887845e32d29f7">http://dtr-test.pidconsortium.eu/#objects/21.T11148/b9b76f887845e32d29f7</ext-link>). In the concept of FAIR DOs, PID Kernel Information as defined by Weigel et al. (<xref ref-type="bibr" rid="B8006524">Weigel et al. 2018</xref>) is key to machine actionability of digital content. Strongly relying on Data Types and stored in the PID record directly at the PID resolution service, PID Kernel Information can be used by machines for fast decision making. The Helmholtz Kernel Information Profile is an attempt to introduce a top-level commonality across all digital assets produced within the Helmholtz Association and beyond to establish a basis for FAIR research data based on FAIR DOs.</p>
        <p>Hereby, the Helmholtz Kernel Information Profile integrates the recommendations of the RDA PID Kernel Information Working Group (<xref ref-type="bibr" rid="B8006476">Anonymous 2022b</xref>) as far as possible. By extending the Draft Kernel Information Profile (<xref ref-type="bibr" rid="B8006524">Weigel et al. 2018</xref>) with additional, mostly optional attributes, the Helmholtz Kernel Information Profile allows the adding of contextual information to FAIR DOs, e.g., research topic, or contact information, which is then available for machine decisions. Furthermore, additional properties for representing relationships between FAIR DOs, e.g., hasMetadata and isMetadataFor, were introduced to allow mutual relations between FAIR DOs.</p>
        <p>Currently, a demonstrator is implemented integrating the above components and services, i.e., PID Service, Data Type Registry, and Typed PID Maker. Fig. <xref ref-type="fig" rid="F8006394">1</xref> outlines the architecture overview of the first version of the demonstrator.</p>
        <p>In this first version, in a semi-automatic workflow, a user enters a Zenodo (<xref ref-type="bibr" rid="B8006468">Anonymous 2022a</xref>) PID in a graphical Web frontend. A mapping component tries to fill automatically at least the properties required by the Helmholtz Kernel Information Profile using the obtained Zenodo metadata record. In a manual validation loop, the user may add or update certain properties before they are sent to an instance of the Typed PID Maker, validated against the Helmholtz Kernel Information Profile, and stored in the record of a newly registered PID using the services of the ePIC consortium. In addition, registered PID records are made searchable via the graphical frontend on top of a search index, e.g., realized using <ext-link ext-link-type="uri" xlink:href="https://www.elastic.co/">https://www.elastic.co/</ext-link>.</p>
        <p>After implementing this generic workflow, additional mappers supporting other repository platforms will be implemented based on the lessons learned, which will lead to a growing number of FAIR DOs and holds potential for providing significant benefits to scientists, e.g., a central point of contact for research data sets stored in different repositories, machine-actionable identification of relevant datasets, and creation of knowledge graphs representing relationships between data sets, repository platforms, researchers and research organizations.</p>
        <p>Furthermore, the gathered experience and its documentation will help others to apply the FAIR DO concept more easily, which will lead to an ever-growing collection of available FAIR DOs with an increasing quality and level of automation at creation time.</p>
      </abstract>
      <kwd-group>
        <label>Keywords</label>
        <kwd>Helmholtz Metadata Collaboration Platform</kwd>
        <kwd>Persistent Identifiers</kwd>
        <kwd>PID Kernel Information Profile</kwd>
        <kwd>Demonstrator</kwd>
      </kwd-group>
      <funding-group>
        <funding-statement>This work has been supported by the research program ‘Engineering Digital Futures’ of the Helmholtz Association of German Research Centers and the Helmholtz Metadata Collaboration Platform.</funding-statement>
      </funding-group>
      <counts>
        <fig-count count="1"/>
        <table-count count="0"/>
        <ref-count count="9"/>
      </counts>
    </article-meta>
    <notes>
      <sec sec-type="Presenting author">
        <title>Presenting author</title>
        <p>Thomas Jejkal</p>
      </sec>
      <sec sec-type="Presented at">
        <title>Presented at</title>
        <p>First International Conference on FAIR Digital Objects, presentation</p>
      </sec>
    </notes>
  </front>
  <back>
    <ref-list>
      <title>References</title>
      <ref id="B8006468">
        <element-citation publication-type="other">
          <person-group person-group-type="author">
            <anonymous/>
          </person-group>
          <year>2022</year>
          <article-title>Zenodo</article-title>
          <uri>https://zenodo.org/</uri>
        </element-citation>
      </ref>
      <ref id="B8006476">
        <element-citation publication-type="other">
          <person-group person-group-type="author">
            <anonymous/>
          </person-group>
          <year>2022</year>
          <article-title>PID Kernel Information Working Group</article-title>
          <uri>https://www.rd-alliance.org/groups/pid-kernel-information-wg</uri>
        </element-citation>
      </ref>
      <ref id="B8006484">
        <element-citation publication-type="other">
          <person-group person-group-type="author">
            <anonymous/>
          </person-group>
          <year>2022</year>
          <article-title>Persistent Identifiers for eResearch (ePIC)</article-title>
          <uri>https://www.pidconsortium.net/</uri>
        </element-citation>
      </ref>
      <ref id="B8006492">
        <element-citation publication-type="other">
          <person-group person-group-type="author">
            <anonymous/>
          </person-group>
          <year>2022</year>
          <article-title>Helmholtz Association</article-title>
          <uri>https://www.helmholtz.de/</uri>
        </element-citation>
      </ref>
      <ref id="B8006500">
        <element-citation publication-type="other">
          <person-group person-group-type="author">
            <anonymous/>
          </person-group>
          <year>2022</year>
          <article-title>Gesellschaft für wissenschaftliche Datenverarbeitung mbH Göttingen</article-title>
          <uri>https://www.gwdg.de/</uri>
        </element-citation>
      </ref>
      <ref id="B8006538">
        <element-citation publication-type="other">
          <person-group person-group-type="author">
            <anonymous/>
          </person-group>
          <year>2022</year>
          <article-title>Helmholtz Metadata Collaboration Platform</article-title>
          <uri>https://helmholtz-metadaten.de/en</uri>
        </element-citation>
      </ref>
      <ref id="B8006516">
        <element-citation publication-type="other">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pfeil</surname>
              <given-names>Andreas</given-names>
            </name>
          </person-group>
          <year>2022</year>
          <article-title>FAIR DO Lab</article-title>
          <uri>https://github.com/kit-data-manager/testbed4inf</uri>
        </element-citation>
      </ref>
      <ref id="B8006508">
        <element-citation publication-type="other">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pfeil</surname>
              <given-names>Andreas</given-names>
            </name>
          </person-group>
          <year>2022</year>
          <article-title>Typed PID Maker</article-title>
          <uri>https://github.com/kit-data-manager/pit-service</uri>
        </element-citation>
      </ref>
      <ref id="B8006524">
        <element-citation publication-type="article">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Weigel</surname>
              <given-names>Tobias</given-names>
            </name>
            <name name-style="western">
              <surname>Plale</surname>
              <given-names>Beth</given-names>
            </name>
            <name name-style="western">
              <surname>Parsons</surname>
              <given-names>Mark</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>Gabriel</given-names>
            </name>
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>Yu</given-names>
            </name>
            <name name-style="western">
              <surname>Schwardmann</surname>
              <given-names>Ulrich</given-names>
            </name>
            <name name-style="western">
              <surname>Quick</surname>
              <given-names>Robert</given-names>
            </name>
            <name name-style="western">
              <surname>Hellström</surname>
              <given-names>Margareta</given-names>
            </name>
            <name name-style="western">
              <surname>Kurakawa</surname>
              <given-names>Kei</given-names>
            </name>
          </person-group>
          <year>2018</year>
          <article-title>RDA Recommendation on PID Kernel Information</article-title>
          <source>Online</source>
          <uri>https://www.rd-alliance.org/group/pid-kernel-information-wg/outcomes/recommendation-pid-kernel-information</uri>
          <pub-id pub-id-type="doi">10.15497/RDA00031</pub-id>
        </element-citation>
      </ref>
    </ref-list>
  </back>
  <floats-group>
    <fig id="F8006394" position="float" orientation="portrait">
      <object-id content-type="arpha">99C4CE26-9D38-5234-A899-E0CB6227DEAA</object-id>
      <object-id content-type="doi">10.3897/rio.8.e94758.figure1</object-id>
      <label>Figure 1.</label>
      <caption>
        <p>Architecture of the FAIR DO demonstrator.</p>
      </caption>
      <graphic xlink:href="rio-08-e94758-g001.png" position="float" id="oo_712612.png" orientation="portrait" xlink:type="simple">
        <uri content-type="original_file">https://binary.pensoft.net/fig/712612</uri>
      </graphic>
    </fig>
  </floats-group>
</article>
