<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//TaxonX//DTD Taxonomic Treatment Publishing DTD v0 20100105//EN" "../../nlm/tax-treatment-NS0.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:tp="http://www.plazi.org/taxpub" article-type="research-article">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">17</journal-id>
      <journal-id journal-id-type="index">urn:lsid:arphahub.com:pub:8E638694-B4E0-570A-856A-746FF325BF6B</journal-id>
      <journal-title-group>
        <journal-title xml:lang="en">Research Ideas and Outcomes</journal-title>
        <abbrev-journal-title xml:lang="en">RIO</abbrev-journal-title>
      </journal-title-group>
      <issn pub-type="epub">2367-7163</issn>
      <publisher>
        <publisher-name>Pensoft Publishers</publisher-name>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="doi">10.3897/rio.6.e54106</article-id>
      <article-id pub-id-type="publisher-id">54106</article-id>
      <article-id pub-id-type="manuscript">13366</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Research Idea</subject>
        </subj-group>
        <subj-group subj-group-type="sdg">
          <subject>Industry</subject>
          <subject> innovation &amp;amp; infrastructure</subject>
          <subject>Partnerships for the goals</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>A virtual “Werkstatt” for digitization in the sciences</article-title>
      </title-group>
      <contrib-group content-type="authors">
        <contrib contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Samuel</surname>
            <given-names>Sheeba</given-names>
          </name>
          <email xlink:type="simple">sheeba.samuel@uni-jena.de</email>
          <uri content-type="orcid">https://orcid.org/0000-0002-7981-8504</uri>
          <xref ref-type="aff" rid="A1">1</xref>
          <xref ref-type="aff" rid="A2">2</xref>
        </contrib>
        <contrib contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Shadaydeh</surname>
            <given-names>Maha</given-names>
          </name>
          <email xlink:type="simple">maha.shadaydeh@uni-jena.de</email>
          <xref ref-type="aff" rid="A1">1</xref>
          <xref ref-type="aff" rid="A3">3</xref>
        </contrib>
        <contrib contrib-type="author" corresp="no">
          <name name-style="western">
            <surname>Böcker</surname>
            <given-names>Sebastian</given-names>
          </name>
          <xref ref-type="aff" rid="A1">1</xref>
          <xref ref-type="aff" rid="A4">4</xref>
        </contrib>
        <contrib contrib-type="author" corresp="no">
          <name name-style="western">
            <surname>Brügmann</surname>
            <given-names>Bernd</given-names>
          </name>
          <xref ref-type="aff" rid="A1">1</xref>
          <xref ref-type="aff" rid="A5">5</xref>
        </contrib>
        <contrib contrib-type="author" corresp="no">
          <name name-style="western">
            <surname>Bucher</surname>
            <given-names>Solveig Franziska</given-names>
          </name>
          <xref ref-type="aff" rid="A1">1</xref>
          <xref ref-type="aff" rid="A6">6</xref>
        </contrib>
        <contrib contrib-type="author" corresp="no">
          <name name-style="western">
            <surname>Deckert</surname>
            <given-names>Volker</given-names>
          </name>
          <xref ref-type="aff" rid="A7">7</xref>
          <xref ref-type="aff" rid="A1">1</xref>
          <xref ref-type="aff" rid="A8">8</xref>
          <xref ref-type="aff" rid="A9">9</xref>
        </contrib>
        <contrib contrib-type="author" corresp="no">
          <name name-style="western">
            <surname>Denzler</surname>
            <given-names>Joachim</given-names>
          </name>
          <xref ref-type="aff" rid="A1">1</xref>
          <xref ref-type="aff" rid="A3">3</xref>
        </contrib>
        <contrib contrib-type="author" corresp="no">
          <name name-style="western">
            <surname>Dittrich</surname>
            <given-names>Peter</given-names>
          </name>
          <xref ref-type="aff" rid="A1">1</xref>
          <xref ref-type="aff" rid="A10">10</xref>
        </contrib>
        <contrib contrib-type="author" corresp="no">
          <name name-style="western">
            <surname>von Eggeling</surname>
            <given-names>Ferdinand</given-names>
          </name>
          <xref ref-type="aff" rid="A1">1</xref>
          <xref ref-type="aff" rid="A11">11</xref>
          <xref ref-type="aff" rid="A12">12</xref>
          <xref ref-type="aff" rid="A13">13</xref>
        </contrib>
        <contrib contrib-type="author" corresp="no">
          <name name-style="western">
            <surname>Güllmar</surname>
            <given-names>Daniel</given-names>
          </name>
          <xref ref-type="aff" rid="A1">1</xref>
          <xref ref-type="aff" rid="A14">14</xref>
        </contrib>
        <contrib contrib-type="author" corresp="no">
          <name name-style="western">
            <surname>Guntinas-Lichius</surname>
            <given-names>Orlando</given-names>
          </name>
          <uri content-type="orcid">https://orcid.org/0000-0001-9671-0784</uri>
          <xref ref-type="aff" rid="A1">1</xref>
          <xref ref-type="aff" rid="A11">11</xref>
        </contrib>
        <contrib contrib-type="author" corresp="no">
          <name name-style="western">
            <surname>König-Ries</surname>
            <given-names>Birgitta</given-names>
          </name>
          <xref ref-type="aff" rid="A1">1</xref>
          <xref ref-type="aff" rid="A2">2</xref>
        </contrib>
        <contrib contrib-type="author" corresp="no">
          <name name-style="western">
            <surname>Löffler</surname>
            <given-names>Frank</given-names>
          </name>
          <uri content-type="orcid">https://orcid.org/0000-0001-6643-6323</uri>
          <xref ref-type="aff" rid="A2">2</xref>
          <xref ref-type="aff" rid="A15">15</xref>
          <xref ref-type="aff" rid="A1">1</xref>
        </contrib>
        <contrib contrib-type="author" corresp="no">
          <name name-style="western">
            <surname>Maicher</surname>
            <given-names>Lutz</given-names>
          </name>
          <xref ref-type="aff" rid="A1">1</xref>
          <xref ref-type="aff" rid="A16">16</xref>
        </contrib>
        <contrib contrib-type="author" corresp="no">
          <name name-style="western">
            <surname>Marz</surname>
            <given-names>Manja</given-names>
          </name>
          <xref ref-type="aff" rid="A17">17</xref>
          <xref ref-type="aff" rid="A1">1</xref>
          <xref ref-type="aff" rid="A18">18</xref>
          <xref ref-type="aff" rid="A19">19</xref>
        </contrib>
        <contrib contrib-type="author" corresp="no">
          <name name-style="western">
            <surname>Migliavacca</surname>
            <given-names>Mirco</given-names>
          </name>
          <xref ref-type="aff" rid="A1">1</xref>
          <xref ref-type="aff" rid="A20">20</xref>
        </contrib>
        <contrib contrib-type="author" corresp="no">
          <name name-style="western">
            <surname>R. Reichenbach</surname>
            <given-names>Jürgen</given-names>
          </name>
          <uri content-type="orcid">https://orcid.org/0000-0002-2640-0630</uri>
          <xref ref-type="aff" rid="A1">1</xref>
          <xref ref-type="aff" rid="A14">14</xref>
        </contrib>
        <contrib contrib-type="author" corresp="no">
          <name name-style="western">
            <surname>Reichstein</surname>
            <given-names>Markus</given-names>
          </name>
          <xref ref-type="aff" rid="A1">1</xref>
          <xref ref-type="aff" rid="A21">21</xref>
        </contrib>
        <contrib contrib-type="author" corresp="no">
          <name name-style="western">
            <surname>Römermann</surname>
            <given-names>Christine</given-names>
          </name>
          <xref ref-type="aff" rid="A22">22</xref>
          <xref ref-type="aff" rid="A1">1</xref>
          <xref ref-type="aff" rid="A6">6</xref>
        </contrib>
        <contrib contrib-type="author" corresp="no">
          <name name-style="western">
            <surname>Wittig</surname>
            <given-names>Andrea</given-names>
          </name>
          <xref ref-type="aff" rid="A1">1</xref>
          <xref ref-type="aff" rid="A23">23</xref>
        </contrib>
      </contrib-group>
      <aff id="A1">
        <label>1</label>
        <addr-line content-type="verbatim">Michael Stifel Center Jena for Data-driven and Simulation Science, Jena, Germany</addr-line>
        <institution>Michael Stifel Center Jena for Data-driven and Simulation Science</institution>
        <addr-line content-type="city">Jena</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="A2">
        <label>2</label>
        <addr-line content-type="verbatim">Heinz-Nixdorf Chair for Distributed Information Systems, Friedrich Schiller University Jena, Jena, Germany</addr-line>
        <institution>Heinz-Nixdorf Chair for Distributed Information Systems, Friedrich Schiller University Jena</institution>
        <addr-line content-type="city">Jena</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="A3">
        <label>3</label>
        <addr-line content-type="verbatim">Department of Mathematics and Computer Science, Friedrich Schiller University Jena, Jena, Germany</addr-line>
        <institution>Department of Mathematics and Computer Science, Friedrich Schiller University Jena</institution>
        <addr-line content-type="city">Jena</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="A4">
        <label>4</label>
        <addr-line content-type="verbatim">Chair of Bioinformatics, Institute of Computer Science, Friedrich Schiller University Jena, Jena, Germany</addr-line>
        <institution>Chair of Bioinformatics, Institute of Computer Science, Friedrich Schiller University Jena</institution>
        <addr-line content-type="city">Jena</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="A5">
        <label>5</label>
        <addr-line content-type="verbatim">Institute for Theoretical Physics, Friedrich Schiller University Jena, Jena, Germany</addr-line>
        <institution>Institute for Theoretical Physics, Friedrich Schiller University Jena</institution>
        <addr-line content-type="city">Jena</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="A6">
        <label>6</label>
        <addr-line content-type="verbatim">Plant Biodiversity, Institute of Ecology and Evolution with Botanical Garden and Herbarium Haussknecht, Friedrich Schiller University Jena, Jena, Germany</addr-line>
        <institution>Plant Biodiversity, Institute of Ecology and Evolution with Botanical Garden and Herbarium Haussknecht, Friedrich Schiller University Jena</institution>
        <addr-line content-type="city">Jena</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="A7">
        <label>7</label>
        <addr-line content-type="verbatim">Institute of Quantum Science and Engineering, Texas A&amp;M, College Station, United States of America</addr-line>
        <institution>Institute of Quantum Science and Engineering, Texas A&amp;M</institution>
        <addr-line content-type="city">College Station</addr-line>
        <country>United States of America</country>
      </aff>
      <aff id="A8">
        <label>8</label>
        <addr-line content-type="verbatim">Leibniz Institute of Photonic Technology, Jena, Germany</addr-line>
        <institution>Leibniz Institute of Photonic Technology</institution>
        <addr-line content-type="city">Jena</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="A9">
        <label>9</label>
        <addr-line content-type="verbatim">Institute of Physical Chemistry, Friedrich Schiller University Jena, Jena, Germany</addr-line>
        <institution>Institute of Physical Chemistry, Friedrich Schiller University Jena</institution>
        <addr-line content-type="city">Jena</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="A10">
        <label>10</label>
        <addr-line content-type="verbatim">Bio System Analysis Group, Institute of Computer Science, Friedrich Schiller University Jena, Jena, Germany</addr-line>
        <institution>Bio System Analysis Group, Institute of Computer Science, Friedrich Schiller University Jena</institution>
        <addr-line content-type="city">Jena</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="A11">
        <label>11</label>
        <addr-line content-type="verbatim">Department of Otorhinolaryngology, Jena University Hospital, Jena, Germany</addr-line>
        <institution>Department of Otorhinolaryngology, Jena University Hospital</institution>
        <addr-line content-type="city">Jena</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="A12">
        <label>12</label>
        <addr-line content-type="verbatim">DFG Core Unit Jena Biophotonic and Imaging Laboratory (JBIL), Jena, Germany</addr-line>
        <institution>DFG Core Unit Jena Biophotonic and Imaging Laboratory (JBIL)</institution>
        <addr-line content-type="city">Jena</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="A13">
        <label>13</label>
        <addr-line content-type="verbatim">Core Unit Proteome Analysis, Jena, Germany</addr-line>
        <institution>Core Unit Proteome Analysis</institution>
        <addr-line content-type="city">Jena</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="A14">
        <label>14</label>
        <addr-line content-type="verbatim">Medical Physics Group, Department of Diagnostic and Interventional Radiology, University Hospital Jena, Jena, Germany</addr-line>
        <institution>Medical Physics Group, Department of Diagnostic and Interventional Radiology, University Hospital Jena</institution>
        <addr-line content-type="city">Jena</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="A15">
        <label>15</label>
        <addr-line content-type="verbatim">Center for Computation and Techn., Louisiana State University, Baton Rouge, United States of America</addr-line>
        <institution>Center for Computation and Techn., Louisiana State University</institution>
        <addr-line content-type="city">Baton Rouge</addr-line>
        <country>United States of America</country>
      </aff>
      <aff id="A16">
        <label>16</label>
        <addr-line content-type="verbatim">Technology Transfer Research Group, Friedrich Schiller University Jena, Jena, Germany</addr-line>
        <institution>Technology Transfer Research Group, Friedrich Schiller University Jena</institution>
        <addr-line content-type="city">Jena</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="A17">
        <label>17</label>
        <addr-line content-type="verbatim">European Virus Bioinformatics Center, Jena, Germany</addr-line>
        <institution>European Virus Bioinformatics Center</institution>
        <addr-line content-type="city">Jena</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="A18">
        <label>18</label>
        <addr-line content-type="verbatim">RNA Bioinformatics and High-Throughput Analysis, Friedrich Schiller University Jena, Jena, Germany</addr-line>
        <institution>RNA Bioinformatics and High-Throughput Analysis, Friedrich Schiller University Jena</institution>
        <addr-line content-type="city">Jena</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="A19">
        <label>19</label>
        <addr-line content-type="verbatim">FLI Leibniz Institute for Age Research, Jena, Germany</addr-line>
        <institution>FLI Leibniz Institute for Age Research</institution>
        <addr-line content-type="city">Jena</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="A20">
        <label>20</label>
        <addr-line content-type="verbatim">Biosphere-Atmosphere Interactions and Experimentation Group, Department Biogeochemical Integration, Max Planck Institute for Biogeochemistry, Jena, Germany</addr-line>
        <institution>Biosphere-Atmosphere Interactions and Experimentation Group, Department Biogeochemical Integration, Max Planck Institute for Biogeochemistry</institution>
        <addr-line content-type="city">Jena</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="A21">
        <label>21</label>
        <addr-line content-type="verbatim">Max Planck Institute for Biogeochemistry, Jena, Germany</addr-line>
        <institution>Max Planck Institute for Biogeochemistry</institution>
        <addr-line content-type="city">Jena</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="A22">
        <label>22</label>
        <addr-line content-type="verbatim">German Centre for Integrative Biodiversity Research (iDiv), Halle-Jena-Leipzig, Germany</addr-line>
        <institution>German Centre for Integrative Biodiversity Research (iDiv)</institution>
        <addr-line content-type="city">Halle-Jena-Leipzig</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="A23">
        <label>23</label>
        <addr-line content-type="verbatim">Department of Radiotherapy and Radiation Oncology , University Hospital Jena,   Friedrich Schiller University Jena, Jena, Germany</addr-line>
        <institution>Department of Radiotherapy and Radiation Oncology , University Hospital Jena,   Friedrich Schiller University Jena</institution>
        <addr-line content-type="city">Jena</addr-line>
        <country>Germany</country>
      </aff>
      <author-notes>
        <fn fn-type="corresp">
          <p>Corresponding authors: Sheeba Samuel (<email xlink:type="simple">sheeba.samuel@uni-jena.de</email>), Maha Shadaydeh (<email xlink:type="simple">maha.shadaydeh@uni-jena.de</email>).</p>
        </fn>
        <fn fn-type="edited-by">
          <p>Academic editor: </p>
        </fn>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2020</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>11</day>
        <month>05</month>
        <year>2020</year>
      </pub-date>
      <volume>6</volume>
      <elocation-id>e54106</elocation-id>
      <uri content-type="arpha" xlink:href="http://openbiodiv.net/E935203A-5FB0-5E07-B1B5-072FCC5C7108">E935203A-5FB0-5E07-B1B5-072FCC5C7108</uri>
      <history>
        <date date-type="received">
          <day>09</day>
          <month>05</month>
          <year>2020</year>
        </date>
      </history>
      <permissions>
        <copyright-statement>Sheeba Samuel, Maha Shadaydeh, Sebastian Böcker, Bernd Brügmann, Solveig Franziska Bucher, Volker Deckert, Joachim Denzler, Peter Dittrich, Ferdinand von Eggeling, Daniel Güllmar, Orlando Guntinas-Lichius, Birgitta König-Ries, Frank Löffler, Lutz Maicher, Manja Marz, Mirco Migliavacca, Jürgen R. Reichenbach, Markus Reichstein, Christine Römermann, Andrea Wittig</copyright-statement>
        <license license-type="creative-commons-attribution" xlink:href="http://creativecommons.org/licenses/by/4.0/" xlink:type="simple">
          <license-p>This is an open access article distributed under the terms of the Creative Commons Attribution License (CC BY 4.0), which permits unrestricted use, distribution, and reproduction in any medium, provided the original author and source are credited.</license-p>
        </license>
      </permissions>
      <abstract>
        <label>Abstract</label>
        <p>Data is central in almost all scientific disciplines nowadays. Furthermore, intelligent systems have developed rapidly in recent years, so that in many disciplines the expectation is emerging that with the help of intelligent systems, significant challenges can be overcome and science can be done in completely new ways. In order for this to succeed, however, first, fundamental research in computer science is still required, and, second, generic tools must be developed on which specialized solutions can be built. In this paper, we introduce a recently started collaborative project funded by the Carl Zeiss Foundation, a virtual manufactory for digitization in the sciences, the “Werkstatt”, which is being established at the Michael Stifel Center Jena (MSCJ) for data-driven and simulation science to address fundamental questions in computer science and applications. The Werkstatt focuses on three key areas, which include generic tools for machine learning, knowledge generation using machine learning processes, and semantic methods for the data life cycle, as well as the application of these topics in different disciplines. Core and pilot projects address the key aspects of the topics and form the basis for sustainable work in the Werkstatt.</p>
      </abstract>
      <kwd-group>
        <label>Keywords</label>
        <kwd>Machine learning</kwd>
        <kwd>semantic methods</kwd>
        <kwd>data management</kwd>
      </kwd-group>
      <funding-group>
        <award-group>
          <funding-source>
            <named-content content-type="funder_name">Carl-Zeiss-Stiftung</named-content>
            <named-content content-type="funder_identifier">100007569</named-content>
            <named-content content-type="funder_doi">http://doi.org/10.13039/100007569</named-content>
          </funding-source>
        </award-group>
      </funding-group>
      <counts>
        <fig-count count="1"/>
        <table-count count="1"/>
        <ref-count count="39"/>
      </counts>
    </article-meta>
    <notes>
      <sec sec-type="Funding program">
        <title>Funding program</title>
        <p>Breakthroughs</p>
      </sec>
      <sec sec-type="Hosting institution">
        <title>Hosting institution</title>
        <p>Friedrich Schiller University Jena, Germany</p>
      </sec>
    </notes>
  </front>
  <body>
    <sec sec-type="Overview and background">
      <title>Overview and background</title>
      <p>Data plays an increasingly important role in many scientific disciplines. They are produced almost everywhere, but their use is still limited. This is mostly due to the fact that in many cases manual analysis is no longer possible due to the large data volume, and automatic analysis is not yet possible due to the lack of tools and/or expertise by the scientists. Here, intelligent systems combined with machine learning promise a solution on how to extract knowledge and how to carry out different steps in the process of the data life cycle from data generation and analysis to storage and subsequent use. This can be done either fully automatically or in collaboration between human and machine. For this vision to become reality, essential challenges need to be tackled. In this paper, we provide an overview of a recently launched project, the digitization “Werkstatt*<xref ref-type="fn" rid="FN5540622">1</xref>,” which aims to contribute in two ways: On the one hand, pilot projects create the opportunity for scientific breakthroughs in three key areas: (1) Fundamentals of generic tools for machine learning, (2) Integration of domain knowledge in machine learning, the explanation of results, as well as the analysis of causality and (3) Semantic methods for data lifecycle support. Findings in these areas are then applied to different application areas, which range from physics, bioinformatics, biology, to biomedicine. On the other hand, the “Werkstatt” offers the structural framework for sustainable, continuous interdisciplinary work in all areas of digitization in the city of Jena. Fig. <xref ref-type="fig" rid="F5540620">1</xref> shows the integration of the ”Werkstatt” into Friedrich Schiller University (FSU Jena) and the research location Jena. Here, researchers from different career levels, organizations, and backgrounds come together. Thus, an ideal framework has been created, within which all steps from the promotion of young scientists to the joint processing of challenging, fundamental research projects will take place. Besides, the “Werkstatt” will also be involved in other activities for the promotion of young talents and networking. To implement this strategy, among other things, annual retreats, joint teaching, and learning activities are planned.</p>
    </sec>
    <sec sec-type="Objectives">
      <title>Objectives</title>
      <p>The “Werkstatt” addresses the following three main research topics in computer science (T1-T3) as well as the application fields (T4):</p>
      <p>
        <bold>T1. Generic tools for machine learning</bold>
      </p>
      <p>An increasingly important topic within machine learning is its automation (AutoML). First steps are the preparation of the data, e.g., by transformation into suitable data formats, the treatment of missing values, or the correction of erroneous data entries. Moreover, most algorithms are highly parameterized and require a good choice of parameter values, e.g., the architecture of a deep neural network. The algorithm must be executed and its results analyzed, with the question of choosing appropriate metrics and measures of success. The analysis may require additional data to be collected later. These diverse, manual optimization steps usually require methodological expertise. Therefore, one goal is to adopt novel methods of AutoML design by using a systematic search. Another challenge for the successful use of machine learning is when the question to be answered by the data is not fixed a priori. One way to deal with this is to learn a flexible, generic model that a human analyst can examine with a suitable visual interface. For this purpose, due to their generality, multivariate probabilistic models are very suitable. A third important area for the development of generic tools for machine learning is the provision of automatic differentiation methods. Frequently, derivatives of an objective function to be optimized are required during learning. Automatic differentiation enables the automated generation of computer programs that calculate first or higher order derivatives of such target functions. However, typical target functions in machine learning have special structures that are not used in standard automatic differentiation methods. A goal that should, therefore, be pursued in this area is, in general, techniques of automatically distinguishing specific structures from the machine to adapt to learning. Such targeted program transformation could result in programs that require significantly less space or whose execution time is significantly shorter than general automatic differentiation techniques.</p>
      <p>
        <bold>T2. Knowledge generation using machine learning processes</bold>
      </p>
      <p>Machine learning methods, in particular supervised learning methods, have been able to learn input/output relationships from data for years and thus solve problems such as classification or regression tasks with high accuracy. In the field of image and scene analysis, the achieved accuracy reaches or surpasses the performance of humans (<xref ref-type="bibr" rid="B5528958">Taigman et al. 2014</xref>).</p>
      <p>With all the advances in generating the correct input/output relationship, challenging issues still exist in data-driven solutions. Scientists who want to generate knowledge from data, would like to make a model refinement via data-model integration and if necessary, switch between hypothesis- and data-driven procedures. Despite the tremendous power of deep neural networks, the following questions are still open and need extensive research efforts: a) Can the machine learning process be understood and reconstructed? b) Is it possible to detect cause-effect relationships by data-driven methods and thus to identify causal relationships for example in multivariate time series? c) How to integrate knowledge about, e.g., physical laws, with a data-driven approach to improve the approximation accuracy of the data estimated model and at the same time reduce the effort required for training (data collection, data annotation, the number of learning steps, etc.)? d) Can a large amount of annotated training data, which are still required for many approaches, be reduced in order to open up new fields of applications, in which such data collection is currently too expensive or completely impossible? In this Werkstatt, we aim to add new contributions to the line of tackling these issues. The main focus will be on the development of unsupervised learning methods as well as data-driven solutions for causal inference in dynamical systems.</p>
      <p>
        <bold>T3. Semantic methods for the data life cycle</bold>
      </p>
      <p>The added value of digitizing the research processes arises not only when the individual steps are improved by intelligent systems, but also when integrated support exists throughout the entire scientific (or data) life cycle. Semantic methods offer promising approaches here. An essential component of digitization of research processes is a precise and machine-understandable description of the experimental data, which helps in the retrieval and re-use of data, the reproducibility of the results, and more generally, scientific progress. However, scientists are reluctant to provide the descriptions because this requires high effort and time. One goal of this topic is to investigate how experiment data can be semi-automatically annotated with semantic metadata with the support of artificial intelligence. Another aspect is the role of data curation and data quality control in this environment. The quality of the research results depends heavily on the quality of the data. However, in the face of a rapidly growing amount of data, the major dilemma is that a high curation level for all the data is not realistic and not cost-effective. In this Werkstatt, we aim to develop novel methods for determining the data value and integrate the methods for the control of curation processes into systems. The main focus will be on the construction and maintenance of knowledge graphs.</p>
      <p>
        <bold>T4. Applications</bold>
      </p>
      <p>The methods developed in T1-T3 are intended to be used, evaluated and optimized directly in fields of application and enable discipline-specific breakthroughs. The development of fundamentals in machine learning and data management in the sciences can only be successful in close cooperation between computer science and the respective disciplines.</p>
    </sec>
    <sec sec-type="Impact">
      <title>Impact</title>
      <p>Digitization and data-driven sciences have very high priority in the strategic planning of the FSU Jena. Research on intelligent systems is of importance for all three research foci, called "profile lines'" of the FSU "Light, Life, Liberty". As early as 2015, the MSCJ was established as a cross-sectional structure. The MSCJ consists of scientists from seven faculties and three non-university research institutes in Jena (Max Planck Institute for Biogeochemistry, Max Planck Institute for Human History, DLR Institute for Data Science). This project aims to contribute to the strengthening of this structure through the development of the Werkstatt, which will facilitate cooperation both between different areas within computer science and specialist sciences, across organizations and across all career stages.</p>
      <p>The structural goal of the project is the networking and expansion of the relevant expertise, the establishment of know-how on intelligent systems in as many specialist disciplines as possible, and the establishment of stable cooperations, thereby opening up the possibility of initiating further third-party funded projects.</p>
    </sec>
    <sec sec-type="Implementation">
      <title>Implementation</title>
      <p>The Werkstatt comprises three core projects and ten pilot projects based on the objective areas. It also comprises activities for international networking and local communications as well as promotion of young talents. In each of the three subject areas, a five years core project is being conducted, each with one postdoctoral researcher. The three core projects shall ensure methodological continuity and also support the pilot projects with expertise and tools. The pilot projects run for three years; each is equipped with one PhD student. There will be a second, somewhat smaller set of pilot projects starting in year three of the Werkstatt. Table <xref ref-type="table" rid="T5545429">1</xref> provides an overview of the core projects (C1-C3) and the current pilot projects (P1-P10) and their coverage of the four themes. The core projects are:</p>
      <p>
        <bold>C1: Automatic machine learning</bold>
      </p>
      <p>In order to use today’s powerful machine learning systems even without detailed machine learning knowledge, e.g., the meaning and effects of the involved hyperparameters, tools for automating the entire process of data analysis and machine learning are necessary. At the very least, one would like to assist a human analyst with the help of machine tools to process the individual steps. The aim of this core project is the further development of methods from the area of AutoML. AutoML is looking for automatic or semi-automatic methods for (1.) data preparation and transformation, (2.) selection of suitable analysis algorithms, (3.) execution of the algorithm, (4.) determination of good hyperparameters of the machine learning algorithms, (5.) selection of measures of success, (6.) data collection of missing data, and (7.) report generation.</p>
      <p>
        <bold>C2: Generative models</bold>
      </p>
      <p>Deep learning methods achieve their remarkable performance from a very large amount of annotated training data. However, in many applications in the sciences, e.g. in medicine, the annotation by the user/expert is very expensive or completely impossible. This core project therefore deals with modern, unsupervised learning methods and their application in the sciences. Specifically, methods for learning generative models, such as e.g. Generative Adversarial Networks (<xref ref-type="bibr" rid="B5529726">Goodfellow et al. 2014</xref>), are examined and expanded so that, for example, unsupervised methods for anomaly detection can be developed. In addition, such models might also be used for data augmentation, i. e. to generate additional training data, or be the basis for estimating and subsequently analysing the underlying data distribution. This core project supports two pilot projects, P2: Detection of causal relationships through deep learning, and P3: Data-driven virus diagnostics at multiple levels I (Methods).</p>
      <p>
        <bold>C3: Integrated provenance management</bold>
      </p>
      <p>One of the essential requirements of scientific experiments is that they are reproducible. For the reproducibility of results, it is important that the experiments are described in a structured way which contains information about the experimental setup and procedure. In recent years, a large number of domain ontologies have been created in numerous application disciplines, which formally model sections of the respective field (see, for example, the NCBI BioPortal with almost 700 ontologies). The expectation is that with the help of these ontologies, finding and linking data can be significantly improved (<xref ref-type="bibr" rid="B5529922">Walls et al. 2014</xref>, <xref ref-type="bibr" rid="B5529875">Klan et al. 2017</xref>). Analogous to the development of domain ontologies for the formal description of data, different approaches to the formal process description have emerged. This includes the provenance ontology PROV-O (<xref ref-type="bibr" rid="B5529895">Lebo et al. 2013</xref>). An extension, REPRODUCE-ME ontology (<xref ref-type="bibr" rid="B5529076">Samuel et al. 2018</xref>) is intended to describe end-to-end provenance of scientific experiments. Independent of these approaches for modeling scientific workflows, first suggestions were published on how such a description for experimental steps using machine learning could look like (<xref ref-type="bibr" rid="B5529911">Schelter et al. 2018</xref>). However, there is no integration of the descriptions of different types of experiment steps, as well as procedures for the further automation of provenance recording and for the use of these descriptions. This gap should be addressed here. The goal of this project is to develop an integrated semi-automatic approach for the management of provenance with human and machine-understandable descriptions which can be used for different purposes.</p>
      <p>The tools developed in these three core projects will be applied in the following ten pilot projects:</p>
      <p>
        <bold>P1: Probabilistic modeling</bold>
      </p>
      <p>In this project, new generic algorithms for learning multivariate probabilistic models are to be developed. To this end, the convex programming approach of <xref ref-type="bibr" rid="B5530661">Chandrasekaran et al. (2012a)</xref> and <xref ref-type="bibr" rid="B5530671">Chandrasekaran et al. (2012b)</xref> is to be extended to mixed distributions. On the one hand, it should be examined whether the theoretical consistency analysis of the optimization approach also applies in this more general framework, on the other hand, this approach should be implemented. A scalable implementation is a non-trivial endeavor since the modeling will likely include group norms above the cone of positive semi-definite matrices, for which there is no standard software. In addition, for an effective implementation an appropriate search strategy based on the regularization parameters of the problem is required. For this purpose, methods from vector optimization are to be developed further. The possible applications of the learned, mixed distributions are diverse. They range from the direct modeling of data from mixed feature spaces to the support of an explorative, interactive analysis of multivariate data sets.</p>
      <p>
        <bold>P2: Detection of causal relationships using deep learning</bold>
      </p>
      <p>Understanding causal effects in dynamic systems plays an important role in numerous disciplines such as economy (<xref ref-type="bibr" rid="B5530506">Granger 1969</xref>), neuroscience (<xref ref-type="bibr" rid="B5530496">Seth et al. 2015</xref>), climate and ecosystems (<xref ref-type="bibr" rid="B5545373">Runge et al. 2019</xref>, <xref ref-type="bibr" rid="B5545341">Shadaydeh et al. 2019</xref>, <xref ref-type="bibr" rid="B5545361">Trifunov et al. 2019</xref>) among many others. The inference of unknown causal effect relationships between the variables of a complex dynamical system from large amounts of data allows for gaining further knowledge on the system’s behaviour. Machine learning methods often attempt to model joint distributions of sets of variables, with the objective of estimating the likely values of certain variables given observations of others. However, modelling joint distributions is not sufficient to make inferences about the values of some variables when other variables are manipulated. The later problem requires an understanding of the cause-effect relationships between the variables (<xref ref-type="bibr" rid="B5530516">Peters et al. 2017</xref>, <xref ref-type="bibr" rid="B5530559">Pearl 2009</xref>). The aim of this project is to investigate to what extent causal relationships in multivariate nonlinear dynamical systems can be derived from learned, deep networks. This will also allow for better insights into the functioning of deep networks and integrates causal relationships in a constructive way. The developed methods will be used and implemented in important and generic tools of the Werkstatt.</p>
      <p>
        <bold>P3: Data-driven virus diagnostics at multiple levels I (Methods)</bold>
      </p>
      <p>This project aims to develop new data analysis and learning methods to improve the diagnosis of known and unknown viruses and their interaction with other pathogens. We start from three complex data streams: sequences (genome and transcriptome of virus and host), images (virus, through TERS technology newly developed in Jena), and molecular spectra (mass spectra of virus and host), which are always cheaper and available in large quantities. We will develop new methods of machine learning and stochastic inference for the metabolomics of viral infections (molecular level). The development is based on our methods (SIRIUS, CSI: FingerID) for gas chromatography and electron ionization. We will develop learning and classification methods that use knowledge of the biological system (virus/ host) in the form of dynamic reaction networks (network level). The learning should take place both by adapting kinetic parameters and by adapting (learning) the network structure through a new form of genetic programming (CMAES-GEGP). At the molecular level and network level, knowledge is generated in the form of learned models, which should then be used for diagnostics.</p>
      <p>
        <bold>P4: Data value oriented curation processes</bold>
      </p>
      <p>The creation and continuous update of large knowledge bases (mainly as knowledge graphs or factual databases) is a common scenario in various disciplines, like Digital Humanities (<xref ref-type="bibr" rid="B5571979">Haslhofer et al. 2018</xref>, <xref ref-type="bibr" rid="B5571895">Maicher et al. 2009</xref>), Citizen Science (<xref ref-type="bibr" rid="B5571946">Bonney et al. 2014</xref>), biodiversity research (<xref ref-type="bibr" rid="B5571908">Nadrowski et al. 2012</xref>) or even economics and managerial sciences (<xref ref-type="bibr" rid="B5571969">Dalle et al. 2017</xref>). In most cases, these knowledge graphs are a curated collection of observational data. Usually, the creation of the knowledge graphs is based on various heterogeneous data sources, integrated and augmented through automatic and semi-automatic approaches, usually combined with manual inputs, curations and amendments. One of the main challenges is the continuous update of the knowledge graphs, irrespective of whether one dozen facts are updated a day, or hundreds of thousands. Data quality aspects like incompleteness, inconsistency, and scalability of curation are central issues hereby (<xref ref-type="bibr" rid="B5571927">Lukyanenko et al. 2016</xref>). Existing rigorous data quality assurance approaches are limited in scenarios where contributions to the knowledge graph are more accidental, fragmented, and voluntary, as it can be expected in citizen science or other crowdsourcing scenarios. Within the Werkstatt, we will experiment with a new approach for data quality assurance: data-value oriented curation processes. Our approach assumes and accepts that the knowledge graph is always imperfect. But defines the requirements on the knowledge graph, to be fulfilled for realizing the functionality (hence: the value) based on this data. In a second step, we implement a system, which continuously observes the level of fulfillment of these data quality requirements (<xref ref-type="bibr" rid="B5571937">Prilop 2014</xref>). In a third step, these measurements on the fulfillment of the requirements automatically inform a workflow system, which guides and priorities the work of all authors and curators of the knowledge graph. By applying this approach, we expect with the given human resources the highest value for research or applications can be extracted from continuously updated knowledge graphs.</p>
      <p>
        <bold>P5: Learning of data annotations</bold>
      </p>
      <p>In many scientific disciplines, sharing data and reusing it in different contexts becomes more and more important. In order for such re-use to be truly successful, a good, ideally machine-readable description of the data is essential. However, today, creating such descriptions requires considerable manual effort. This project aims to utilize and extend machine learning techniques in creating the semantic annotations for existing datasets thus considerably reducing effort and enabling the reuse of untapped resources. Different data sources from the Biodiversity domain will be processed, with the ultimate goal to expose them as a semantic knowledge graph. To build this graph, we aim to combine different sources of information about any given dataset including the (tabular) dataset itself, existing metadata and abstracts or full texts of associated publications.</p>
      <p>
        <bold>P6: Deep learning for data analysis in gravitational wave astronomy</bold>
      </p>
      <p>The so-called Phenom-models (<xref ref-type="bibr" rid="B5530751">Ajith et al. 2011</xref>), one of the two standard methods for the analysis of the first gravitational wave signal (<xref ref-type="bibr" rid="B5547023">Abbott and et al. 2016</xref>), were established by hand. In this project, these models will be significantly improved by self-learning algorithms. Essential for methods of this sort are analytical and numerical gravitational wave templates, being computed in Jena for different sources such as black holes and neutron stars.</p>
      <p>The goal is to combine the current wave templates for concrete physical problems with new machine learning methods for data analysis. Since this field of research has only just started to attract international attention (<xref ref-type="bibr" rid="B5530769">George and Huerta 2018</xref>, <xref ref-type="bibr" rid="B5530779">Shen et al. 2017</xref>), the integration into the large framework of the MSCJ, involving both physicists and computer scientists, will play an important and fruitful role.</p>
      <p>
        <bold>P7: Combined analysis of image data of head and neck cancer</bold>
      </p>
      <p>Large multimodal image datasets accumulate before, during, and after therapy of head and neck cancer. The data mainly arise from endoscopic and microscopic images gained during surgery, histopathological images from tissue samples, proteomic data from MALDI imaging, as well as pre-therapeutical and post-therapeutical radiological imaging data used for tumor staging and therapy control (computed tomography, positron emission tomography, magnetic resonance imaging). So far, these different image data sources are not linked to each other, although it has been shown that the combined analysis of such data allows a much better prediction of tumor control and outcome (<xref ref-type="bibr" rid="B5530240">von Eggeling et al. 2012</xref>, <xref ref-type="bibr" rid="B5530251">Bogowicz et al. 2017b</xref>, <xref ref-type="bibr" rid="B5530267">Bogowicz et al. 2017a</xref>, <xref ref-type="bibr" rid="B5530280">Oetjen et al. 2013</xref>). Aim of pilot project P7 therefore is the aggregation of all data collected during the patient’s therapy on a common platform. The data will be analyzed with machine learning tools. The aim is the breakthrough for the development of more precise diagnostics and better therapy for head and neck cancer.</p>
      <p>
        <bold>P8: Use and reuse of MRI data in biomedical research environment</bold>
      </p>
      <p>Assessing the data quality of biomedical imaging data, and particularly MR imaging data, is an essential prerequisite for the preparation and application of big data methods in clinical science. Conventional approaches for evaluating the data quality of magnetic resonance imaging (MRI) data are largely limited to certain sub-aspects and are often contrast-specific (<xref ref-type="bibr" rid="B5552189">Vogelbacher et al. 2019</xref>). Quantitative MR contrasts, however, such as, e.g., quantitative susceptibility mapping (QSM) (<xref ref-type="bibr" rid="B5548917">Reichenbach et al. 2015</xref>) or quantitative diffusion imaging (<xref ref-type="bibr" rid="B5548927">Güllmar et al. 2017</xref>), require careful quality assessment before mapping. Holistic, contrast-independent procedures are currently missing. Against this background, the objectives of this project are as follows: (1) Identification of high quality, artifact-free data sets using image-based approaches; (2) Identification of potential bias factors in the datasets; (3) Consideration and/or correction of these factors; (4) Implementation of so-called image-derived phenotypes (IDPs). A future main area of application of such data could be the assessment of disease time courses based on previous knowledge, whereby the retrospective comparison data should be identified by using the IDPs.</p>
      <p>
        <bold>P9: Development, digitization and establishment of sensor-based phenological observations</bold>
      </p>
      <p>Monitoring biodiversity is one of the major tasks in the light of global change and was identified as such in the coalition agreement of the German government. Changes in phenology which are also referred to as “fingerprint of climate change” (<xref ref-type="bibr" rid="B5529774">Menzel and Fabian 1999</xref>, <xref ref-type="bibr" rid="B5529784">Parmesan and Yohe 2003</xref>, <xref ref-type="bibr" rid="B5529794">Root et al. 2003</xref>) lead to changes in biodiversity (<xref ref-type="bibr" rid="B5529806">Miller-Rushing and Primack 2008</xref>) and impact ecosystem services (e.g. provisioning of flowers for pollinators) on a landscape scale (<xref ref-type="bibr" rid="B5529816">Senapathi et al. 2015</xref>). In order to mitigate effects of climate change, an objective monitoring of ecosystems is important.</p>
      <p>The development of digitized, species-specific monitoring of phenological data in different ecosystems using sensors linked to automated image-analysis can be seen as a next step to objectively collect extensive data on plant phenology (BigData). This is not only important in the light of global change, but also offers the possibility of species-specific, automated monitoring in areas such as remote sensing and applied ecology.</p>
      <p>
        <bold>P10: Data-driven virus diagnostics at multiple levels II (application)</bold>
      </p>
      <p>In this project, modern analysis and learning methods are applied to achieve a breakthrough in virus diagnostics. It forms a unit with P3 (methods). On the experimental side, a fluidic chip system (artificial blood vessel) is used to infect host cells with influenza A viruses and secondarily with a pathogenic bacterium (MRSA) in a controlled manner. Furthermore, patient samples (urine, sputum, blood, BAL, CSF) from the University Hospital Jena are available and we have access to the CAPNETZ biobank with about 8000 serum samples. In the AG Marz new methods of real-time sequencing will be developed and applied (sequence level).</p>
      <p>Real-time detection will be achieved by the MinION system (Oxford Nanopore Technologies) recently established in Jena. The system has the dimensions of a USB stick and can also be used directly on the patient. The sequencing of host DNA/RNA will be automatically stopped in real-time and another DNA/RNA fragment will be sequenced instead. The sequencing platform has already been established and tested. The tip-enhanced Raman scattering (TERS) will be used for pathogen detection in complex samples (image plane). The group in Jena has already successfully detected viruses using TERS under defined conditions. Here, protocols are being developed that allow the detection of pathogens in complex patient samples. A combination of dark-field and AFM methods ensures a fast pre-characterization of the sample, which simplifies the actual TERS characterization. As a result, we expect that the new sequence level (P10), image level (P10), molecular level (P3) and network level (P3) methods will contribute to a significant improvement in individualized real-time diagnostics.</p>
    </sec>
  </body>
  <back>
    <ack>
      <title>Acknowledgements</title>
      <p>The authors thank the Carl Zeiss Foundation for the financial support within the scope of the program line "Breakthroughs: Exploring Intelligent Systems'' for "Digitization - explore the basics, use applications''.</p>
    </ack>
    <sec sec-type="Funding program">
      <title>Funding program</title>
      <p>Breakthroughs</p>
    </sec>
    <sec sec-type="Grant title">
      <title>Grant title</title>
      <p>A Virtual Werkstatt for Digitization in the Sciences</p>
    </sec>
    <sec sec-type="Hosting institution">
      <title>Hosting institution</title>
      <p>Friedrich Schiller University Jena, Germany</p>
    </sec>
    <ref-list>
      <title>References</title>
      <ref id="B5547023">
        <element-citation publication-type="article">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Abbott</surname>
              <given-names>B. P.</given-names>
            </name>
            <name name-style="western">
              <surname>et al.</surname>
            </name>
          </person-group>
          <year>2016</year>
          <article-title>Properties of the binary black hole merger GW150914</article-title>
          <source>Physical Review Letters</source>
          <volume>116</volume>
          <fpage>241102</fpage>
          <pub-id pub-id-type="doi">10.1103/PhysRevLett.116.241102</pub-id>
        </element-citation>
      </ref>
      <ref id="B5530751">
        <element-citation publication-type="article">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ajith</surname>
              <given-names>P.</given-names>
            </name>
            <name name-style="western">
              <surname>Hannam</surname>
              <given-names>M.</given-names>
            </name>
            <name name-style="western">
              <surname>Husa</surname>
              <given-names>S.</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Y.</given-names>
            </name>
            <name name-style="western">
              <surname>Brügmann</surname>
              <given-names>B.</given-names>
            </name>
            <name name-style="western">
              <surname>Dorband</surname>
              <given-names>N.</given-names>
            </name>
            <name name-style="western">
              <surname>Müller</surname>
              <given-names>D.</given-names>
            </name>
            <name name-style="western">
              <surname>Ohme</surname>
              <given-names>F.</given-names>
            </name>
            <name name-style="western">
              <surname>Pollney</surname>
              <given-names>D.</given-names>
            </name>
            <name name-style="western">
              <surname>Reisswig</surname>
              <given-names>C.</given-names>
            </name>
            <name name-style="western">
              <surname>Santamaría</surname>
              <given-names>L.</given-names>
            </name>
            <name name-style="western">
              <surname>Seiler</surname>
              <given-names>J.</given-names>
            </name>
          </person-group>
          <year>2011</year>
          <article-title>Inspiral-merger-ringdown waveforms for black-hole binaries with non-precessing spins</article-title>
          <source>Physical Review Letters</source>
          <volume>106</volume>
          <fpage>241101</fpage>
          <pub-id pub-id-type="doi">10.1103/PhysRevLett.106.241101</pub-id>
        </element-citation>
      </ref>
      <ref id="B5530267">
        <element-citation publication-type="article">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bogowicz</surname>
              <given-names>Marta</given-names>
            </name>
            <name name-style="western">
              <surname>Riesterer</surname>
              <given-names>Oliver</given-names>
            </name>
            <name name-style="western">
              <surname>Stark</surname>
              <given-names>Luisa Sabrina</given-names>
            </name>
            <name name-style="western">
              <surname>Studer</surname>
              <given-names>Gabriela</given-names>
            </name>
            <name name-style="western">
              <surname>Unkelbach</surname>
              <given-names>Jan</given-names>
            </name>
            <name name-style="western">
              <surname>Guckenberger</surname>
              <given-names>Matthias</given-names>
            </name>
            <name name-style="western">
              <surname>Tanadini-Lang</surname>
              <given-names>Stephanie</given-names>
            </name>
          </person-group>
          <year>2017</year>
          <article-title>Comparison of PET and CT radiomics for prediction of local tumor control in head and neck squamous cell carcinoma</article-title>
          <source>Acta Oncologica</source>
          <volume>56</volume>
          <issue>11</issue>
          <fpage>1531</fpage>
          <lpage>1536</lpage>
          <pub-id pub-id-type="doi">10.1080/0284186x.2017.1346382</pub-id>
        </element-citation>
      </ref>
      <ref id="B5530251">
        <element-citation publication-type="article">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bogowicz</surname>
              <given-names>Marta</given-names>
            </name>
            <name name-style="western">
              <surname>Leijenaar</surname>
              <given-names>Ralph T. H.</given-names>
            </name>
            <name name-style="western">
              <surname>Tanadini-Lang</surname>
              <given-names>Stephanie</given-names>
            </name>
            <name name-style="western">
              <surname>Riesterer</surname>
              <given-names>Oliver</given-names>
            </name>
            <name name-style="western">
              <surname>Pruschy</surname>
              <given-names>Martin</given-names>
            </name>
            <name name-style="western">
              <surname>Studer</surname>
              <given-names>Gabriela</given-names>
            </name>
            <name name-style="western">
              <surname>Unkelbach</surname>
              <given-names>Jan</given-names>
            </name>
            <name name-style="western">
              <surname>Guckenberger</surname>
              <given-names>Matthias</given-names>
            </name>
            <name name-style="western">
              <surname>Konukoglu</surname>
              <given-names>Ender</given-names>
            </name>
            <name name-style="western">
              <surname>Lambin</surname>
              <given-names>Philippe</given-names>
            </name>
          </person-group>
          <year>2017</year>
          <article-title>Post-radiochemotherapy PET radiomics in head and neck cancer – The influence of radiomics implementation on the reproducibility of local control tumor models</article-title>
          <source>Radiotherapy and Oncology</source>
          <volume>125</volume>
          <issue>3</issue>
          <fpage>385</fpage>
          <lpage>391</lpage>
          <pub-id pub-id-type="doi">10.1016/j.radonc.2017.10.023</pub-id>
        </element-citation>
      </ref>
      <ref id="B5571946">
        <element-citation publication-type="article">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bonney</surname>
              <given-names>R.</given-names>
            </name>
            <name name-style="western">
              <surname>Shirk</surname>
              <given-names>J. L.</given-names>
            </name>
            <name name-style="western">
              <surname>Phillips</surname>
              <given-names>T. B.</given-names>
            </name>
            <name name-style="western">
              <surname>Wiggins</surname>
              <given-names>A.</given-names>
            </name>
            <name name-style="western">
              <surname>Ballard</surname>
              <given-names>H. L.</given-names>
            </name>
            <name name-style="western">
              <surname>Miller-Rushing</surname>
              <given-names>A. J.</given-names>
            </name>
            <name name-style="western">
              <surname>Parrish</surname>
              <given-names>J. K.</given-names>
            </name>
          </person-group>
          <year>2014</year>
          <article-title>Next steps for citizen science</article-title>
          <source>Science</source>
          <volume>343</volume>
          <issue>6178</issue>
          <fpage>1436</fpage>
          <lpage>1437</lpage>
          <pub-id pub-id-type="doi">10.1126/science.1251554</pub-id>
        </element-citation>
      </ref>
      <ref id="B5530661">
        <element-citation publication-type="article">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chandrasekaran</surname>
              <given-names>Venkat</given-names>
            </name>
            <name name-style="western">
              <surname>Parrilo</surname>
              <given-names>Pablo A.</given-names>
            </name>
            <name name-style="western">
              <surname>Willsky</surname>
              <given-names>Alan S.</given-names>
            </name>
          </person-group>
          <year>2012</year>
          <article-title>Latent variable graphical model selection via convex optimization</article-title>
          <source>The Annals of Statistics</source>
          <volume>40</volume>
          <issue>4</issue>
          <fpage>1935</fpage>
          <lpage>1967</lpage>
          <pub-id pub-id-type="doi">10.1214/11-AOS949</pub-id>
        </element-citation>
      </ref>
      <ref id="B5530671">
        <element-citation publication-type="article">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chandrasekaran</surname>
              <given-names>Venkat</given-names>
            </name>
            <name name-style="western">
              <surname>Parrilo</surname>
              <given-names>Pablo A.</given-names>
            </name>
            <name name-style="western">
              <surname>Willsky</surname>
              <given-names>Alan S.</given-names>
            </name>
          </person-group>
          <year>2012</year>
          <article-title>Rejoinder: Latent variable graphical model selection via convex optimization</article-title>
          <source>The Annals of Statistics</source>
          <volume>40</volume>
          <issue>4</issue>
          <fpage>2005</fpage>
          <lpage>2013</lpage>
          <pub-id pub-id-type="doi">10.1214/12-AOS1020</pub-id>
        </element-citation>
      </ref>
      <ref id="B5571969">
        <element-citation publication-type="article">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dalle</surname>
              <given-names>Jean-Michel</given-names>
            </name>
            <name name-style="western">
              <surname>Besten</surname>
              <given-names>Matthijs den</given-names>
            </name>
            <name name-style="western">
              <surname>Menon</surname>
              <given-names>Carlo</given-names>
            </name>
          </person-group>
          <year>2017</year>
          <article-title>Using Crunchbase for economic and managerial research</article-title>
          <source>OECD Science, Technology and Industry Working Papers</source>
          <pub-id pub-id-type="doi">10.1787/6c418d60-en</pub-id>
        </element-citation>
      </ref>
      <ref id="B5530769">
        <element-citation publication-type="article">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>George</surname>
              <given-names>Daniel</given-names>
            </name>
            <name name-style="western">
              <surname>Huerta</surname>
              <given-names>E. A.</given-names>
            </name>
          </person-group>
          <year>2018</year>
          <article-title>Deep neural networks to enable real-time multimessenger astrophysics</article-title>
          <source>Physical Review D</source>
          <volume>97</volume>
          <issue>4</issue>
        </element-citation>
      </ref>
      <ref id="B5529726">
        <element-citation publication-type="conference-preoceeding">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Goodfellow</surname>
              <given-names>Ian J.</given-names>
            </name>
            <name name-style="western">
              <surname>Pouget-Abadie</surname>
              <given-names>Jean</given-names>
            </name>
            <name name-style="western">
              <surname>Mirza</surname>
              <given-names>Mehdi</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>Bing</given-names>
            </name>
            <name name-style="western">
              <surname>Warde-Farley</surname>
              <given-names>David</given-names>
            </name>
            <name name-style="western">
              <surname>Ozair</surname>
              <given-names>Sherjil</given-names>
            </name>
            <name name-style="western">
              <surname>Courville</surname>
              <given-names>Aaron</given-names>
            </name>
            <name name-style="western">
              <surname>Bengio</surname>
              <given-names>Yoshua</given-names>
            </name>
          </person-group>
          <year>2014</year>
          <source>Generative adversarial nets</source>
          <conf-name>Proceedings of the 27th International Conference on Neural Information Processing Systems. Volume 2</conf-name>
        </element-citation>
      </ref>
      <ref id="B5530506">
        <element-citation publication-type="article">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Granger</surname>
              <given-names>C. W. J.</given-names>
            </name>
          </person-group>
          <year>1969</year>
          <article-title>Investigating causal relations by econometric models and cross-spectral methods</article-title>
          <source>Econometrica</source>
          <volume>37</volume>
          <issue>3</issue>
          <fpage>424</fpage>
          <lpage>438</lpage>
          <pub-id pub-id-type="doi">10.2307/1912791</pub-id>
        </element-citation>
      </ref>
      <ref id="B5548927">
        <element-citation publication-type="article">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Güllmar</surname>
              <given-names>Daniel</given-names>
            </name>
            <name name-style="western">
              <surname>Seeliger</surname>
              <given-names>Tabea</given-names>
            </name>
            <name name-style="western">
              <surname>Gudziol</surname>
              <given-names>Hilmar</given-names>
            </name>
            <name name-style="western">
              <surname>Teichgräber</surname>
              <given-names>Ulf KM</given-names>
            </name>
            <name name-style="western">
              <surname>Reichenbach</surname>
              <given-names>Jürgen R</given-names>
            </name>
            <name name-style="western">
              <surname>Guntinas-Lichius</surname>
              <given-names>Orlando</given-names>
            </name>
            <name name-style="western">
              <surname>Bitter</surname>
              <given-names>Thomas</given-names>
            </name>
          </person-group>
          <year>2017</year>
          <article-title>Improvement of olfactory function after sinus surgery correlates with white matter properties measured by diffusion tensor imaging</article-title>
          <source>Neuroscience</source>
          <volume>360</volume>
          <fpage>190</fpage>
          <lpage>196</lpage>
          <pub-id pub-id-type="doi">10.1016/j.neuroscience.2017.07.070</pub-id>
        </element-citation>
      </ref>
      <ref id="B5571979">
        <element-citation publication-type="article">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Haslhofer</surname>
              <given-names>Bernhard</given-names>
            </name>
            <name name-style="western">
              <surname>Isaac</surname>
              <given-names>Antoine</given-names>
            </name>
            <name name-style="western">
              <surname>Simon</surname>
              <given-names>Rainer</given-names>
            </name>
          </person-group>
          <year>2018</year>
          <article-title>Knowledge graphs in the libraries and digital humanities domain</article-title>
          <source>Encyclopedia of Big Data Technologies</source>
          <fpage>1</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1007/978-3-319-63962-8_291-1</pub-id>
        </element-citation>
      </ref>
      <ref id="B5529875">
        <element-citation publication-type="conference-preoceeding">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Klan</surname>
              <given-names>Friederike</given-names>
            </name>
            <name name-style="western">
              <surname>Faessler</surname>
              <given-names>Erik</given-names>
            </name>
            <name name-style="western">
              <surname>Algergawy</surname>
              <given-names>Alsayed</given-names>
            </name>
            <name name-style="western">
              <surname>König-Ries</surname>
              <given-names>Birgitta</given-names>
            </name>
            <name name-style="western">
              <surname>Hahn</surname>
              <given-names>Udo</given-names>
            </name>
          </person-group>
          <year>2017</year>
          <source>Integrated semantic search on structured and unstructured data in the ADOnIS system</source>
          <conf-name>Proceedings of the 2nd International Workshop on Semantics for Biodiversity co-located with 16th International Semantic Web Conference (ISWC 2017)</conf-name>
        </element-citation>
      </ref>
      <ref id="B5529895">
        <element-citation publication-type="article">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lebo</surname>
              <given-names>Timothy</given-names>
            </name>
            <name name-style="western">
              <surname>Sahoo</surname>
              <given-names>Satya</given-names>
            </name>
            <name name-style="western">
              <surname>McGuinness</surname>
              <given-names>Deborah</given-names>
            </name>
            <name name-style="western">
              <surname>Belhajjame</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Cheney</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Corsar</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Garijo</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Soiland-Reyes</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zednik</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <year>2013</year>
          <article-title>PROV-O: The PROV Ontology, 2013</article-title>
          <source>W3C Recommendation</source>
          <uri>http://www.w3.org/TR/2013/REC-prov-o-20130430</uri>
        </element-citation>
      </ref>
      <ref id="B5571927">
        <element-citation publication-type="article">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lukyanenko</surname>
              <given-names>Roman</given-names>
            </name>
            <name name-style="western">
              <surname>Parsons</surname>
              <given-names>Jeffrey</given-names>
            </name>
            <name name-style="western">
              <surname>Wiersma</surname>
              <given-names>Yolanda F.</given-names>
            </name>
          </person-group>
          <year>2016</year>
          <article-title>Emerging problems of data quality in citizen science</article-title>
          <source>Conservation Biology</source>
          <volume>30</volume>
          <issue>3</issue>
          <fpage>447</fpage>
          <lpage>449</lpage>
          <pub-id pub-id-type="doi">10.1111/cobi.12706</pub-id>
        </element-citation>
      </ref>
      <ref id="B5571895">
        <element-citation publication-type="article">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Maicher</surname>
              <given-names>Lutz</given-names>
            </name>
            <name name-style="western">
              <surname>Ahmed</surname>
              <given-names>Khalil</given-names>
            </name>
            <name name-style="western">
              <surname>Isolani</surname>
              <given-names>Alida</given-names>
            </name>
            <name name-style="western">
              <surname>Kivelä</surname>
              <given-names>Aki</given-names>
            </name>
            <name name-style="western">
              <surname>Oh</surname>
              <given-names>Sam</given-names>
            </name>
            <name name-style="western">
              <surname>Pitts</surname>
              <given-names>Antony</given-names>
            </name>
            <name name-style="western">
              <surname>Vassallo</surname>
              <given-names>Salvatore</given-names>
            </name>
          </person-group>
          <year>2009</year>
          <article-title>Topic maps in the eHumanities</article-title>
          <source>2009 Fifth IEEE International Conference on e-Science</source>
          <pub-id pub-id-type="doi">10.1109/e-science.2009.9</pub-id>
        </element-citation>
      </ref>
      <ref id="B5529774">
        <element-citation publication-type="article">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Menzel</surname>
              <given-names>Annette</given-names>
            </name>
            <name name-style="western">
              <surname>Fabian</surname>
              <given-names>Peter</given-names>
            </name>
          </person-group>
          <year>1999</year>
          <article-title>Growing season extended in Europe</article-title>
          <source>Nature</source>
          <volume>397</volume>
          <issue>6721</issue>
          <fpage>659</fpage>
          <lpage>659</lpage>
          <pub-id pub-id-type="doi">10.1038/17709</pub-id>
        </element-citation>
      </ref>
      <ref id="B5529806">
        <element-citation publication-type="article">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Miller-Rushing</surname>
              <given-names>Abraham J.</given-names>
            </name>
            <name name-style="western">
              <surname>Primack</surname>
              <given-names>Richard B.</given-names>
            </name>
          </person-group>
          <year>2008</year>
          <article-title>Global warming and flowering times in Thoreau's concord: a community perspective.</article-title>
          <source>Ecology</source>
          <volume>89</volume>
          <issue>2</issue>
          <fpage>332</fpage>
          <lpage>341</lpage>
          <pub-id pub-id-type="doi">10.1890/07-0068.1</pub-id>
        </element-citation>
      </ref>
      <ref id="B5571908">
        <element-citation publication-type="article">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nadrowski</surname>
              <given-names>Karin</given-names>
            </name>
            <name name-style="western">
              <surname>Ratcliffe</surname>
              <given-names>Sophia</given-names>
            </name>
            <name name-style="western">
              <surname>Bönisch</surname>
              <given-names>Gerhard</given-names>
            </name>
            <name name-style="western">
              <surname>Bruelheide</surname>
              <given-names>Helge</given-names>
            </name>
            <name name-style="western">
              <surname>Kattge</surname>
              <given-names>Jens</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Xiaojuan</given-names>
            </name>
            <name name-style="western">
              <surname>Maicher</surname>
              <given-names>Lutz</given-names>
            </name>
            <name name-style="western">
              <surname>Mi</surname>
              <given-names>Xiangcheng</given-names>
            </name>
            <name name-style="western">
              <surname>Prilop</surname>
              <given-names>Michael</given-names>
            </name>
            <name name-style="western">
              <surname>Seifarth</surname>
              <given-names>Daniel</given-names>
            </name>
            <name name-style="western">
              <surname>Welter</surname>
              <given-names>Karl</given-names>
            </name>
            <name name-style="western">
              <surname>Windisch</surname>
              <given-names>Sven</given-names>
            </name>
            <name name-style="western">
              <surname>Wirth</surname>
              <given-names>Christian</given-names>
            </name>
          </person-group>
          <year>2012</year>
          <article-title>Harmonizing, annotating and sharing data in biodiversity-ecosystem functioning research</article-title>
          <source>Methods in Ecology and Evolution</source>
          <volume>4</volume>
          <issue>2</issue>
          <fpage>201</fpage>
          <lpage>205</lpage>
          <pub-id pub-id-type="doi">10.1111/2041-210x.12009</pub-id>
        </element-citation>
      </ref>
      <ref id="B5530280">
        <element-citation publication-type="article">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Oetjen</surname>
              <given-names>Janina</given-names>
            </name>
            <name name-style="western">
              <surname>Aichler</surname>
              <given-names>Michaela</given-names>
            </name>
            <name name-style="western">
              <surname>Trede</surname>
              <given-names>Dennis</given-names>
            </name>
            <name name-style="western">
              <surname>Strehlow</surname>
              <given-names>Jan</given-names>
            </name>
            <name name-style="western">
              <surname>Berger</surname>
              <given-names>Judith</given-names>
            </name>
            <name name-style="western">
              <surname>Heldmann</surname>
              <given-names>Stefan</given-names>
            </name>
            <name name-style="western">
              <surname>Becker</surname>
              <given-names>Michael</given-names>
            </name>
            <name name-style="western">
              <surname>Gottschalk</surname>
              <given-names>Michael</given-names>
            </name>
            <name name-style="western">
              <surname>Kobarg</surname>
              <given-names>Jan Hendrik</given-names>
            </name>
            <name name-style="western">
              <surname>Wirtz</surname>
              <given-names>Stefan</given-names>
            </name>
            <name name-style="western">
              <surname>Schiffler</surname>
              <given-names>Stefan</given-names>
            </name>
            <name name-style="western">
              <surname>Thiele</surname>
              <given-names>Herbert</given-names>
            </name>
            <name name-style="western">
              <surname>Walch</surname>
              <given-names>Axel</given-names>
            </name>
            <name name-style="western">
              <surname>Maass</surname>
              <given-names>Peter</given-names>
            </name>
            <name name-style="western">
              <surname>Alexandrov</surname>
              <given-names>Theodore</given-names>
            </name>
          </person-group>
          <year>2013</year>
          <article-title>MRI-compatible pipeline for three-dimensional MALDI imaging mass spectrometry using PAXgene fixation</article-title>
          <source>Journal of Proteomics</source>
          <volume>90</volume>
          <fpage>52</fpage>
          <lpage>60</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jprot.2013.03.013</pub-id>
        </element-citation>
      </ref>
      <ref id="B5529784">
        <element-citation publication-type="article">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Parmesan</surname>
              <given-names>Camille</given-names>
            </name>
            <name name-style="western">
              <surname>Yohe</surname>
              <given-names>Gary</given-names>
            </name>
          </person-group>
          <year>2003</year>
          <article-title>A globally coherent fingerprint of climate change impacts across natural systems</article-title>
          <source>Nature</source>
          <volume>421</volume>
          <issue>6918</issue>
          <fpage>37</fpage>
          <lpage>42</lpage>
          <pub-id pub-id-type="doi">10.1038/nature01286</pub-id>
        </element-citation>
      </ref>
      <ref id="B5530559">
        <element-citation publication-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pearl</surname>
              <given-names>Judea</given-names>
            </name>
          </person-group>
          <year>2009</year>
          <source>Causality: Models, reasoning and inference</source>
          <edition>Edition 2nd</edition>
          <publisher-name>Cambridge University Press</publisher-name>
          <publisher-loc>New York, NY, USA</publisher-loc>
          <pub-id pub-id-type="doi">10.1017/CBO9780511803161</pub-id>
        </element-citation>
      </ref>
      <ref id="B5530516">
        <element-citation publication-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Peters</surname>
              <given-names>J.</given-names>
            </name>
            <name name-style="western">
              <surname>Janzing</surname>
              <given-names>D.</given-names>
            </name>
            <name name-style="western">
              <surname>Schölkopf</surname>
              <given-names>B.</given-names>
            </name>
          </person-group>
          <year>2017</year>
          <source>Elements of causal inference - foundations and learning algorithms</source>
          <publisher-name>The MIT Press</publisher-name>
          <publisher-loc>Cambridge, MA, USA</publisher-loc>
        </element-citation>
      </ref>
      <ref id="B5571937">
        <element-citation publication-type="thesis">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Prilop</surname>
              <given-names>Michael</given-names>
            </name>
          </person-group>
          <year>2014</year>
          <source>Continuous data quality assessment in information systems</source>
          <publisher-name>Leipzig University</publisher-name>
        </element-citation>
      </ref>
      <ref id="B5548917">
        <element-citation publication-type="article">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Reichenbach</surname>
              <given-names>J. R.</given-names>
            </name>
            <name name-style="western">
              <surname>Schweser</surname>
              <given-names>F.</given-names>
            </name>
            <name name-style="western">
              <surname>Serres</surname>
              <given-names>B.</given-names>
            </name>
            <name name-style="western">
              <surname>Deistung</surname>
              <given-names>A.</given-names>
            </name>
          </person-group>
          <year>2015</year>
          <article-title>Quantitative susceptibility mapping: Concepts and applications</article-title>
          <source>Clinical Neuroradiology</source>
          <volume>25</volume>
          <fpage>225</fpage>
          <lpage>230</lpage>
          <pub-id pub-id-type="doi">10.1007/s00062-015-0432-9</pub-id>
        </element-citation>
      </ref>
      <ref id="B5529794">
        <element-citation publication-type="article">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Root</surname>
              <given-names>Terry L.</given-names>
            </name>
            <name name-style="western">
              <surname>Price</surname>
              <given-names>Jeff T.</given-names>
            </name>
            <name name-style="western">
              <surname>Hall</surname>
              <given-names>Kimberly R.</given-names>
            </name>
            <name name-style="western">
              <surname>Schneider</surname>
              <given-names>Stephen H.</given-names>
            </name>
            <name name-style="western">
              <surname>Rosenzweig</surname>
              <given-names>Cynthia</given-names>
            </name>
            <name name-style="western">
              <surname>Pounds</surname>
              <given-names>J. Alan</given-names>
            </name>
          </person-group>
          <year>2003</year>
          <article-title>Fingerprints of global warming on wild animals and plants</article-title>
          <source>Nature</source>
          <volume>421</volume>
          <issue>6918</issue>
          <fpage>57</fpage>
          <lpage>60</lpage>
          <pub-id pub-id-type="doi">10.1038/nature01333</pub-id>
        </element-citation>
      </ref>
      <ref id="B5545373">
        <element-citation publication-type="article">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Runge</surname>
              <given-names>Jakob</given-names>
            </name>
            <name name-style="western">
              <surname>Bathiany</surname>
              <given-names>Sebastian</given-names>
            </name>
            <name name-style="western">
              <surname>Bollt</surname>
              <given-names>Erik</given-names>
            </name>
            <name name-style="western">
              <surname>Camps-Valls</surname>
              <given-names>Gustau</given-names>
            </name>
            <name name-style="western">
              <surname>Coumou</surname>
              <given-names>Dim</given-names>
            </name>
            <name name-style="western">
              <surname>Deyle</surname>
              <given-names>Ethan</given-names>
            </name>
            <name name-style="western">
              <surname>Glymour</surname>
              <given-names>Clark</given-names>
            </name>
            <name name-style="western">
              <surname>Kretschmer</surname>
              <given-names>Marlene</given-names>
            </name>
            <name name-style="western">
              <surname>Mahecha</surname>
              <given-names>Miguel D.</given-names>
            </name>
            <name name-style="western">
              <surname>Muñoz-Marí</surname>
              <given-names>Jordi</given-names>
            </name>
            <name name-style="western">
              <surname>van Nes</surname>
              <given-names>Egbert H.</given-names>
            </name>
            <name name-style="western">
              <surname>Peters</surname>
              <given-names>Jonas</given-names>
            </name>
            <name name-style="western">
              <surname>Quax</surname>
              <given-names>Rick</given-names>
            </name>
            <name name-style="western">
              <surname>Reichstein</surname>
              <given-names>Markus</given-names>
            </name>
            <name name-style="western">
              <surname>Scheffer</surname>
              <given-names>Marten</given-names>
            </name>
            <name name-style="western">
              <surname>Schölkopf</surname>
              <given-names>Bernhard</given-names>
            </name>
            <name name-style="western">
              <surname>Spirtes</surname>
              <given-names>Peter</given-names>
            </name>
            <name name-style="western">
              <surname>Sugihara</surname>
              <given-names>George</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>Jie</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Kun</given-names>
            </name>
            <name name-style="western">
              <surname>Zscheischler</surname>
              <given-names>Jakob</given-names>
            </name>
          </person-group>
          <year>2019</year>
          <article-title>Inferring causation from time series in Earth system sciences</article-title>
          <source>Nature Communications</source>
          <volume>10</volume>
          <issue>1</issue>
          <fpage>2553</fpage>
          <pub-id pub-id-type="doi">10.1038/s41467-019-10105-3</pub-id>
        </element-citation>
      </ref>
      <ref id="B5529076">
        <element-citation publication-type="conference-preoceeding">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Samuel</surname>
              <given-names>Sheeba</given-names>
            </name>
            <name name-style="western">
              <surname>Groeneveld</surname>
              <given-names>Kathrin</given-names>
            </name>
            <name name-style="western">
              <surname>Taubert</surname>
              <given-names>Frank</given-names>
            </name>
            <name name-style="western">
              <surname>Walther</surname>
              <given-names>Daniel</given-names>
            </name>
            <name name-style="western">
              <surname>Kache</surname>
              <given-names>Tom</given-names>
            </name>
            <name name-style="western">
              <surname>Langenstück</surname>
              <given-names>Teresa</given-names>
            </name>
            <name name-style="western">
              <surname>König-Ries</surname>
              <given-names>Birgitta</given-names>
            </name>
            <name name-style="western">
              <surname>Bücker</surname>
              <given-names>H. Martin</given-names>
            </name>
            <name name-style="western">
              <surname>Biskup</surname>
              <given-names>Christoph</given-names>
            </name>
          </person-group>
          <year>2018</year>
          <source>The Story of an experiment: a provenance-based semantic approach towards research reproducibility</source>
          <conf-name>Proceedings of the 11th International Conference Semantic Web Applications and Tools for Life Sciences, SWAT4LS 2018, Antwerp, Belgium, December 3-6, 2018</conf-name>
        </element-citation>
      </ref>
      <ref id="B5529911">
        <element-citation publication-type="conference-preoceeding">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schelter</surname>
              <given-names>Sebastian</given-names>
            </name>
            <name name-style="western">
              <surname>Böse</surname>
              <given-names>Joos-Hendrik</given-names>
            </name>
            <name name-style="western">
              <surname>Kirschnick</surname>
              <given-names>Johannes</given-names>
            </name>
            <name name-style="western">
              <surname>Klein</surname>
              <given-names>Thoralf</given-names>
            </name>
            <name name-style="western">
              <surname>Seufert</surname>
              <given-names>Stephan</given-names>
            </name>
          </person-group>
          <year>2018</year>
          <source>Declarative metadata management: A missing piece in end-to-end machine learning</source>
          <conf-name>Proceedings of SYSML’18, Feb 2018, Stanford, USA</conf-name>
        </element-citation>
      </ref>
      <ref id="B5529816">
        <element-citation publication-type="article">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Senapathi</surname>
              <given-names>D.</given-names>
            </name>
            <name name-style="western">
              <surname>Carvalheiro</surname>
              <given-names>L. G.</given-names>
            </name>
            <name name-style="western">
              <surname>Biesmeijer</surname>
              <given-names>J. C.</given-names>
            </name>
            <name name-style="western">
              <surname>Dodson</surname>
              <given-names>C. -A.</given-names>
            </name>
            <name name-style="western">
              <surname>Evans</surname>
              <given-names>R. L.</given-names>
            </name>
            <name name-style="western">
              <surname>McKerchar</surname>
              <given-names>M.</given-names>
            </name>
            <name name-style="western">
              <surname>Morton</surname>
              <given-names>R. D.</given-names>
            </name>
            <name name-style="western">
              <surname>Moss</surname>
              <given-names>E. D.</given-names>
            </name>
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>S. P. M.</given-names>
            </name>
            <name name-style="western">
              <surname>Kunin</surname>
              <given-names>W. E.</given-names>
            </name>
            <name name-style="western">
              <surname>Potts</surname>
              <given-names>S. G.</given-names>
            </name>
          </person-group>
          <year>2015</year>
          <article-title>The impact of over 80 years of land cover changes on bee and wasp pollinator communities in England</article-title>
          <source>Proceedings of the Royal Society B: Biological Sciences</source>
          <volume>282</volume>
          <issue>1806</issue>
          <fpage>20150294</fpage>
          <lpage>20150294</lpage>
          <pub-id pub-id-type="doi">10.1098/rspb.2015.0294</pub-id>
        </element-citation>
      </ref>
      <ref id="B5530496">
        <element-citation publication-type="article">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Seth</surname>
              <given-names>Anil K.</given-names>
            </name>
            <name name-style="western">
              <surname>Barrett</surname>
              <given-names>Adam B.</given-names>
            </name>
            <name name-style="western">
              <surname>Barnett</surname>
              <given-names>Lionel</given-names>
            </name>
          </person-group>
          <year>2015</year>
          <article-title>Granger causality analysis in neuroscience and neuroimaging</article-title>
          <source>Journal of Neuroscience</source>
          <volume>35</volume>
          <issue>8</issue>
          <fpage>3293</fpage>
          <lpage>3297</lpage>
          <pub-id pub-id-type="doi">10.1523/JNEUROSCI.4399-14.2015</pub-id>
        </element-citation>
      </ref>
      <ref id="B5545341">
        <element-citation publication-type="article">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shadaydeh</surname>
              <given-names>Maha</given-names>
            </name>
            <name name-style="western">
              <surname>Denzler</surname>
              <given-names>Joachim</given-names>
            </name>
            <name name-style="western">
              <surname>García</surname>
              <given-names>Yanira Guanche</given-names>
            </name>
            <name name-style="western">
              <surname>Mahecha</surname>
              <given-names>Miguel</given-names>
            </name>
          </person-group>
          <year>2019</year>
          <article-title>Time-frequency causal inference uncovers anomalous events in environmental systems</article-title>
          <source>Lecture Notes in Computer Science</source>
          <fpage>499</fpage>
          <lpage>512</lpage>
          <pub-id pub-id-type="doi">10.1007/978-3-030-33676-9_35</pub-id>
        </element-citation>
      </ref>
      <ref id="B5530779">
        <element-citation publication-type="article">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>Hongyu</given-names>
            </name>
            <name name-style="western">
              <surname>George</surname>
              <given-names>Daniel</given-names>
            </name>
            <name name-style="western">
              <surname>Huerta</surname>
              <given-names>E. A.</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>Zhizhen</given-names>
            </name>
          </person-group>
          <year>2017</year>
          <article-title>Denoising gravitational waves using deep learning with recurrent denoising autoencoders</article-title>
          <source>arXiv: 1711.09919</source>
          <pub-id pub-id-type="doi">10.1109/ICASSP.2019.8683061</pub-id>
        </element-citation>
      </ref>
      <ref id="B5528958">
        <element-citation publication-type="conference-preoceeding">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Taigman</surname>
              <given-names>Yaniv</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Ming</given-names>
            </name>
            <name name-style="western">
              <surname>Ranzato</surname>
              <given-names>Marc'Aurelio</given-names>
            </name>
            <name name-style="western">
              <surname>Wolf</surname>
              <given-names>Lior</given-names>
            </name>
          </person-group>
          <year>2014</year>
          <source>DeepFace: closing the gap to human-level performance in face verification</source>
          <conf-name>Proceedings of the 2014 IEEE Conference on Computer Vision and Pattern Recognition</conf-name>
          <pub-id pub-id-type="doi">10.1109/CVPR.2014.220</pub-id>
        </element-citation>
      </ref>
      <ref id="B5545361">
        <element-citation publication-type="article">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Trifunov</surname>
              <given-names>Violeta Teodora</given-names>
            </name>
            <name name-style="western">
              <surname>Shadaydeh</surname>
              <given-names>Maha</given-names>
            </name>
            <name name-style="western">
              <surname>Runge</surname>
              <given-names>Jakob</given-names>
            </name>
            <name name-style="western">
              <surname>Eyring</surname>
              <given-names>Veronika</given-names>
            </name>
            <name name-style="western">
              <surname>Reichstein</surname>
              <given-names>Markus</given-names>
            </name>
            <name name-style="western">
              <surname>Denzler</surname>
              <given-names>Joachim</given-names>
            </name>
          </person-group>
          <year>2019</year>
          <article-title>Nonlinear causal link estimation under hidden confounding with an application to time series anomaly detection</article-title>
          <source>Lecture Notes in Computer Science</source>
          <fpage>261</fpage>
          <lpage>273</lpage>
          <pub-id pub-id-type="doi">10.1007/978-3-030-33676-9_18</pub-id>
        </element-citation>
      </ref>
      <ref id="B5552189">
        <element-citation publication-type="article">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vogelbacher</surname>
              <given-names>C.</given-names>
            </name>
            <name name-style="western">
              <surname>Bopp</surname>
              <given-names>M. H.A.</given-names>
            </name>
            <name name-style="western">
              <surname>Schuster</surname>
              <given-names>V.</given-names>
            </name>
            <name name-style="western">
              <surname>Herholz</surname>
              <given-names>P.</given-names>
            </name>
            <name name-style="western">
              <surname>Jansen</surname>
              <given-names>A.</given-names>
            </name>
            <name name-style="western">
              <surname>Sommer</surname>
              <given-names>J.</given-names>
            </name>
          </person-group>
          <year>2019</year>
          <article-title>LAB-QA2GO: A free, easy-to-use toolbox for the quality assessment of magnetic resonance imaging data</article-title>
          <source>Frontiers in Neuroscience</source>
          <volume>13</volume>
          <fpage>688</fpage>
          <pub-id pub-id-type="doi">10.3389/fnins.2019.00688</pub-id>
        </element-citation>
      </ref>
      <ref id="B5530240">
        <element-citation publication-type="article">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>von Eggeling</surname>
              <given-names>Ferdinand</given-names>
            </name>
            <name name-style="western">
              <surname>Crecelius</surname>
              <given-names>Anna C.</given-names>
            </name>
            <name name-style="western">
              <surname>Schubert</surname>
              <given-names>Ulrich S.</given-names>
            </name>
            <name name-style="western">
              <surname>Guntinas-Lichius</surname>
              <given-names>Orlando</given-names>
            </name>
            <name name-style="western">
              <surname>Ernst</surname>
              <given-names>Günther</given-names>
            </name>
          </person-group>
          <year>2012</year>
          <article-title>MALDI-Imaging: What can be expected?</article-title>
          <source>European Journal of Radiology</source>
          <volume>81</volume>
          <fpage>183</fpage>
          <lpage>184</lpage>
          <pub-id pub-id-type="doi">10.1016/s0720-048x(12)70075-x</pub-id>
        </element-citation>
      </ref>
      <ref id="B5529922">
        <element-citation publication-type="article">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Walls</surname>
              <given-names>RL</given-names>
            </name>
            <name name-style="western">
              <surname>Deck</surname>
              <given-names>John</given-names>
            </name>
            <name name-style="western">
              <surname>Guralnick</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Baskauf</surname>
              <given-names>Steve</given-names>
            </name>
            <name name-style="western">
              <surname>Beaman</surname>
              <given-names>Reed</given-names>
            </name>
            <name name-style="western">
              <surname>Blum</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bowers</surname>
              <given-names>S.</given-names>
            </name>
            <name name-style="western">
              <surname>Buttigieg</surname>
              <given-names>P. L.</given-names>
            </name>
            <name name-style="western">
              <surname>Davies</surname>
              <given-names>N.</given-names>
            </name>
            <name name-style="western">
              <surname>Endresen</surname>
              <given-names>D.</given-names>
            </name>
            <name name-style="western">
              <surname>et al.</surname>
            </name>
          </person-group>
          <year>2014</year>
          <article-title>Semantics in support of biodiversity knowledge discovery: an introduction to the biological collections ontology and related ontologies</article-title>
          <source>PLOS One</source>
          <volume>9</volume>
          <issue>3</issue>
          <fpage>e89606</fpage>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0089606</pub-id>
        </element-citation>
      </ref>
    </ref-list>
    <fn-group>
      <fn id="FN5540622">
        <label>*1</label>
        <p>“Werkstatt” is the German term for “workshop” (in the sense of manufactory)</p>
      </fn>
    </fn-group>
  </back>
  <floats-group>
    <fig id="F5540620" position="float" orientation="portrait">
      <object-id content-type="arpha">DFCD371A-DC35-5403-9928-8C6A24844349</object-id>
      <object-id content-type="doi">10.3897/rio.6.e54106.figure1</object-id>
      <label>Figure 1.</label>
      <caption>
        <p>Integration of the "Werkstatt" in the Friedrich Schiller University and the research center of Jena.</p>
      </caption>
      <graphic xlink:href="rio-06-e54106-g001.png" position="float" id="oo_383912.png" orientation="portrait" xlink:type="simple">
        <uri content-type="original_file">https://binary.pensoft.net/fig/383912</uri>
      </graphic>
    </fig>
    <table-wrap id="T5545429" position="float" orientation="portrait">
      <label>Table 1.</label>
      <caption>
        <p>Project overview and coverage of the four main themes: T1. Generic tools for machine learning, T2. Knowledge generation using machine learning processes, T3. Semantic methods for the data life cycle, and T4. Applications (black/empty square indicates primary/secondary contribution).</p>
      </caption>
      <table rules="all" border="1" style="height: 423px; width: 671px;">
        <tbody>
          <tr>
            <td rowspan="1" colspan="1" style="width: 367px;">
              <bold>Project</bold>
            </td>
            <td rowspan="1" colspan="1" style="width: 63px;">
              <bold>T1</bold>
            </td>
            <td rowspan="1" colspan="1" style="width: 61px;">
              <bold>T2</bold>
            </td>
            <td rowspan="1" colspan="1" style="width: 56px;">
              <bold>T3</bold>
            </td>
            <td rowspan="1" colspan="1" style="width: 53px;">
              <bold>T4</bold>
            </td>
          </tr>
          <tr>
            <td rowspan="1" colspan="1" style="width: 367px;">Core Project C1: Automatic machine learning</td>
            <td rowspan="1" colspan="1" style="width: 63px;">⬛</td>
            <td rowspan="1" colspan="1" style="width: 61px;">▢</td>
            <td rowspan="1" colspan="1" style="width: 56px;"/>
            <td rowspan="1" colspan="1" style="width: 53px;"/>
          </tr>
          <tr>
            <td rowspan="1" colspan="1" style="width: 367px;">Pilot Project P1: Probabilistic modeling</td>
            <td rowspan="1" colspan="1" style="width: 63px;">⬛</td>
            <td rowspan="1" colspan="1" style="width: 61px;">▢</td>
            <td rowspan="1" colspan="1" style="width: 56px;"/>
            <td rowspan="1" colspan="1" style="width: 53px;"/>
          </tr>
          <tr>
            <td rowspan="1" colspan="1" style="width: 367px;">Core Project C2: Generative models</td>
            <td rowspan="1" colspan="1" style="width: 63px;"/>
            <td rowspan="1" colspan="1" style="width: 61px;">⬛</td>
            <td rowspan="1" colspan="1" style="width: 56px;">▢</td>
            <td rowspan="1" colspan="1" style="width: 53px;">▢</td>
          </tr>
          <tr>
            <td rowspan="1" colspan="1" style="width: 367px;">Pilot Project P2: Detection of causal relationships using deep learning</td>
            <td rowspan="1" colspan="1" style="width: 63px;"/>
            <td rowspan="1" colspan="1" style="width: 61px;">⬛</td>
            <td rowspan="1" colspan="1" style="width: 56px;"/>
            <td rowspan="1" colspan="1" style="width: 53px;">▢</td>
          </tr>
          <tr>
            <td rowspan="1" colspan="1" style="width: 367px;">Pilot Project P3: Virus diagnostics I (Methods)</td>
            <td rowspan="1" colspan="1" style="width: 63px;"/>
            <td rowspan="1" colspan="1" style="width: 61px;">⬛</td>
            <td rowspan="1" colspan="1" style="width: 56px;"/>
            <td rowspan="1" colspan="1" style="width: 53px;">▢</td>
          </tr>
          <tr>
            <td rowspan="1" colspan="1" style="width: 367px;">Core Project C3: Provenance management</td>
            <td rowspan="1" colspan="1" style="width: 63px;"/>
            <td rowspan="1" colspan="1" style="width: 61px;"/>
            <td rowspan="1" colspan="1" style="width: 56px;">⬛</td>
            <td rowspan="1" colspan="1" style="width: 53px;">▢</td>
          </tr>
          <tr>
            <td rowspan="1" colspan="1" style="width: 367px;">Pilot Project P4: Data curation</td>
            <td rowspan="1" colspan="1" style="width: 63px;"/>
            <td rowspan="1" colspan="1" style="width: 61px;"/>
            <td rowspan="1" colspan="1" style="width: 56px;">⬛</td>
            <td rowspan="1" colspan="1" style="width: 53px;">▢</td>
          </tr>
          <tr>
            <td rowspan="1" colspan="1" style="width: 367px;">Pilot Project P5: Annotation</td>
            <td rowspan="1" colspan="1" style="width: 63px;"/>
            <td rowspan="1" colspan="1" style="width: 61px;">▢</td>
            <td rowspan="1" colspan="1" style="width: 56px;">⬛</td>
            <td rowspan="1" colspan="1" style="width: 53px;">▢</td>
          </tr>
          <tr>
            <td rowspan="1" colspan="1" style="width: 367px;">Pilot Project P6: Gravitational waves</td>
            <td rowspan="1" colspan="1" style="width: 63px;">▢</td>
            <td rowspan="1" colspan="1" style="width: 61px;">▢</td>
            <td rowspan="1" colspan="1" style="width: 56px;"/>
            <td rowspan="1" colspan="1" style="width: 53px;">⬛</td>
          </tr>
          <tr>
            <td rowspan="1" colspan="1" style="width: 367px;">Pilot Project P7: Head and neck cancer</td>
            <td rowspan="1" colspan="1" style="width: 63px;"/>
            <td rowspan="1" colspan="1" style="width: 61px;">▢</td>
            <td rowspan="1" colspan="1" style="width: 56px;"/>
            <td rowspan="1" colspan="1" style="width: 53px;">⬛</td>
          </tr>
          <tr>
            <td rowspan="1" colspan="1" style="width: 367px;">Pilot Project P8: MRI data</td>
            <td rowspan="1" colspan="1" style="width: 63px;"/>
            <td rowspan="1" colspan="1" style="width: 61px;"/>
            <td rowspan="1" colspan="1" style="width: 56px;"/>
            <td rowspan="1" colspan="1" style="width: 53px;">⬛</td>
          </tr>
          <tr>
            <td rowspan="1" colspan="1" style="width: 367px;">Pilot Project P9: Phenology</td>
            <td rowspan="1" colspan="1" style="width: 63px;"/>
            <td rowspan="1" colspan="1" style="width: 61px;">▢</td>
            <td rowspan="1" colspan="1" style="width: 56px;">▢</td>
            <td rowspan="1" colspan="1" style="width: 53px;">⬛</td>
          </tr>
          <tr>
            <td rowspan="1" colspan="1" style="width: 367px;">Pilot Project P10: Virus diagnostics II (applications)</td>
            <td rowspan="1" colspan="1" style="width: 63px;"/>
            <td rowspan="1" colspan="1" style="width: 61px;">▢</td>
            <td rowspan="1" colspan="1" style="width: 56px;"/>
            <td rowspan="1" colspan="1" style="width: 53px;">⬛</td>
          </tr>
        </tbody>
      </table>
    </table-wrap>
  </floats-group>
</article>
