<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="review-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v26i1e51297</article-id>
      <article-id pub-id-type="pmid">39178413</article-id>
      <article-id pub-id-type="doi">10.2196/51297</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Review</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Review</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Provenance Information for Biomedical Data and Workflows: Scoping Review</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Mavragani</surname>
            <given-names>Amaryllis</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Cai</surname>
            <given-names>Jingheng</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Budde</surname>
            <given-names>Kai</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Gierend</surname>
            <given-names>Kerstin</given-names>
          </name>
          <degrees>Dipl-Inf(FH)</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Department of Biomedical Informatics</institution>
            <institution>Mannheim Institute for intelligent Systems in Medicine</institution>
            <institution>Medical Faculty Mannheim, Heidelberg University</institution>
            <addr-line>Theodor-Kutzer-Ufer 1-3</addr-line>
            <addr-line>Mannheim, 68167</addr-line>
            <country>Germany</country>
            <phone>49 621383 ext 8087</phone>
            <email>kerstin.gierend@medma.uni-heidelberg.de</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0417-3454</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Krüger</surname>
            <given-names>Frank</given-names>
          </name>
          <degrees>Dr.-Ing.</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7925-3363</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Genehr</surname>
            <given-names>Sascha</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-1702-6878</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Hartmann</surname>
            <given-names>Francisca</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0009-2727-9148</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Siegel</surname>
            <given-names>Fabian</given-names>
          </name>
          <degrees>Dr med</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9673-5030</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Waltemath</surname>
            <given-names>Dagmar</given-names>
          </name>
          <degrees>Dr-Ing</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5886-5563</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Ganslandt</surname>
            <given-names>Thomas</given-names>
          </name>
          <degrees>Dr med habi.</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6864-8936</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Zeleke</surname>
            <given-names>Atinkut Alamirrew</given-names>
          </name>
          <degrees>Dr rer medic</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7838-9050</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Department of Biomedical Informatics</institution>
        <institution>Mannheim Institute for intelligent Systems in Medicine</institution>
        <institution>Medical Faculty Mannheim, Heidelberg University</institution>
        <addr-line>Mannheim</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Faculty of Engineering</institution>
        <institution>Wismar University of Applied Sciences</institution>
        <addr-line>Wismar</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Institute of Communications Engineering</institution>
        <institution>University of Rostock</institution>
        <addr-line>Rostock</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Department of Medical Informatics</institution>
        <institution>University Medicine Greifswald</institution>
        <addr-line>Greifswald</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Chair of Medical Informatics</institution>
        <institution>Friedrich-Alexander-Universität Erlangen-Nürnberg</institution>
        <addr-line>Erlangen</addr-line>
        <country>Germany</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Kerstin Gierend <email>kerstin.gierend@medma.uni-heidelberg.de</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2024</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>23</day>
        <month>8</month>
        <year>2024</year>
      </pub-date>
      <volume>26</volume>
      <elocation-id>e51297</elocation-id>
      <history>
        <date date-type="received">
          <day>27</day>
          <month>7</month>
          <year>2023</year>
        </date>
        <date date-type="rev-request">
          <day>10</day>
          <month>5</month>
          <year>2024</year>
        </date>
        <date date-type="rev-recd">
          <day>30</day>
          <month>5</month>
          <year>2024</year>
        </date>
        <date date-type="accepted">
          <day>17</day>
          <month>6</month>
          <year>2024</year>
        </date>
      </history>
      <copyright-statement>©Kerstin Gierend, Frank Krüger, Sascha Genehr, Francisca Hartmann, Fabian Siegel, Dagmar Waltemath, Thomas Ganslandt, Atinkut Alamirrew Zeleke. Originally published in the Journal of Medical Internet Research (https://www.jmir.org), 23.08.2024.</copyright-statement>
      <copyright-year>2024</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research (ISSN 1438-8871), is properly cited. The complete bibliographic information, a link to the original publication on https://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2024/1/e51297" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>The record of the origin and the history of data, known as provenance, holds importance. Provenance information leads to higher interpretability of scientific results and enables reliable collaboration and data sharing. However, the lack of comprehensive evidence on provenance approaches hinders the uptake of good scientific practice in clinical research.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This scoping review aims to identify approaches and criteria for provenance tracking in the biomedical domain. We reviewed the state-of-the-art frameworks, associated artifacts, and methodologies for provenance tracking.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>This scoping review followed the methodological framework developed by Arksey and O’Malley. We searched the PubMed and Web of Science databases for English-language articles published from 2006 to 2022. Title and abstract screening were carried out by 4 independent reviewers using the Rayyan screening tool. A majority vote was required for consent on the eligibility of papers based on the defined inclusion and exclusion criteria. Full-text reading and screening were performed independently by 2 reviewers, and information was extracted into a pretested template for the 5 research questions. Disagreements were resolved by a domain expert. The study protocol has previously been published.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>The search resulted in a total of 764 papers. Of 624 identified, deduplicated papers, 66 (10.6%) studies fulfilled the inclusion criteria. We identified diverse provenance-tracking approaches ranging from practical provenance processing and managing to theoretical frameworks distinguishing diverse concepts and details of data and metadata models, provenance components, and notations. A substantial majority investigated underlying requirements to varying extents and validation intensities but lacked completeness in provenance coverage. Mostly, cited requirements concerned the knowledge about data integrity and reproducibility. Moreover, these revolved around robust data quality assessments, consistent policies for sensitive data protection, improved user interfaces, and automated ontology development. We found that different stakeholder groups benefit from the availability of provenance information. Thereby, we recognized that the term <italic>provenance</italic> is subjected to an evolutionary and technical process with multifaceted meanings and roles. Challenges included organizational and technical issues linked to data annotation, provenance modeling, and performance, amplified by subsequent matters such as enhanced provenance information and quality principles.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>As data volumes grow and computing power increases, the challenge of scaling provenance systems to handle data efficiently and assist complex queries intensifies, necessitating automated and scalable solutions. With rising legal and scientific demands, there is an urgent need for greater transparency in implementing provenance systems in research projects, despite the challenges of unresolved granularity and knowledge bottlenecks. We believe that our recommendations enable quality and guide the implementation of auditable and measurable provenance approaches as well as solutions in the daily tasks of biomedical scientists.</p>
        </sec>
        <sec sec-type="registered-report">
          <title>International Registered Report Identifier (IRRID)</title>
          <p>RR2-10.2196/31750</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>provenance</kwd>
        <kwd>biomedical research</kwd>
        <kwd>data management</kwd>
        <kwd>scoping review</kwd>
        <kwd>health care data</kwd>
        <kwd>software life cycle</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>Both the use and reuse of electronic medical and patient-related data offers enormous potential for clinical research [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. National programs such as the German Medical Informatics Initiatives support knowledge discovery and data sharing using adequate computational infrastructure and secure processes [<xref ref-type="bibr" rid="ref3">3</xref>]. In this context, provenance information (<xref ref-type="boxed-text" rid="box1">Textbox 1</xref>) offers access to quality assured, traceable, and credible shared data. These and other advantages of data provenance have been demonstrated, for instance, in the EU Horizon 2020 TRANSFORM project [<xref ref-type="bibr" rid="ref4">4</xref>] or in the MeDaX Knowledge Graph Prototype [<xref ref-type="bibr" rid="ref5">5</xref>]. Schröder et al [<xref ref-type="bibr" rid="ref6">6</xref>] provided an “Electronic Laboratory Notebook” use case in the wet lab to show how provenance supports the understanding and reproducibility of research investigations. At the same time, researchers not considering the origin of data run into the hazard of systematically incomplete or wrong data [<xref ref-type="bibr" rid="ref7">7</xref>].</p>
        <p>Notably, the FAIR (findable, accessible, interoperable, reusable) guiding principles for data stewardship [<xref ref-type="bibr" rid="ref9">9</xref>] explicitly mention provenance [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref11">11</xref>]. A provenance-oriented approach requires thorough planning, execution, and evaluation of data management processes in the respective application domain [<xref ref-type="bibr" rid="ref2">2</xref>]. In the scientific context, adherence to criteria such as consistency, interoperability, and confidentiality are generally required across all software tools [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>].</p>
        <p>The concept and implementation of provenance are essential for most scientific domains, such as environmental fields (geoprocessing workflows or climate assessments), in nuclear fusion engineering, or material sciences [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref15">15</xref>]. In particular, the biomedical domains demand comprehensive investigation and information about their data management scenarios, including extract, transform, load jobs for data transfer and integration. Reliable data and data pipelines both require provenance data to be embedded in concepts for traceability to understand the relationships between results and source data.</p>
        <boxed-text id="box1" position="float">
          <title>Provenance terminology.</title>
          <p>
            <bold>Definition</bold>
          </p>
          <list list-type="bullet">
            <list-item>
              <p>“Provenance” is a description of what happened to a data item [<xref ref-type="bibr" rid="ref4">4</xref>]. Information models such as the World Wide Web Consortium (W3C) PROV standard formally define provenance of a resource as “a record that describes entities and processes involved in producing and delivering or otherwise influencing that resource” [<xref ref-type="bibr" rid="ref8">8</xref>].</p>
            </list-item>
          </list>
        </boxed-text>
      </sec>
      <sec>
        <title>Objectives</title>
        <p>Our work reviews approaches and criteria for provenance tracking in the biomedical domain and discloses current knowledge gaps. This comprises modeling aspects and metadata frameworks for meaningful and usable provenance information during the creation, collection, and processing of  scientific biomedical data. The review also covers the examination of quality aspects relating to provenance.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Overview</title>
        <p>We followed the scoping methodological framework developed by Arksey and O’Malley [<xref ref-type="bibr" rid="ref16">16</xref>] for conducting a scoping review with the following stages: (1) stage 1—identification of the research questions (RQs); (2) stage 2—identification of relevant studies; (3) stage 3—study selection; (4) stage 4—data extraction and charting; and (5) stage 5—collating, summarizing, and reporting the results.</p>
      </sec>
      <sec>
        <title>Change From the Original Protocol</title>
        <p>The protocol of this scoping review has been published in <italic>JMIR Research Protocols</italic> (international registered report identifier DERR1-10.2196/31750) [<xref ref-type="bibr" rid="ref17">17</xref>]. In accordance with the original protocol developed for this scoping review, the search period was initially planned to include studies published from January 2006 to March 2021. However, due to the extensive nature of the data extraction and write-up process, it became apparent that additional time was necessary to ensure a comprehensive analysis of the relevant literature. As a result, we extended the search period from 2006 to the end of 2022.</p>
        <p>No other changes were made to the original protocol. Thematic analysis methods were applied to analyze the extracted data by organizing themes according to the RQs [<xref ref-type="bibr" rid="ref18">18</xref>]. In line with the framework developed by Arksey and O’Malley [<xref ref-type="bibr" rid="ref16">16</xref>], the review does not attempt to assess the quality of studies or the risk of bias. It also does not assess the generalizability of the results.</p>
      </sec>
      <sec>
        <title>Stage 1: Identifying RQs</title>
        <p>The main objective of this review was to investigate existing evidence regarding approaches and criteria for provenance tracking and disclosing current knowledge gaps in the biomedical domain. The objective led to the following RQs:</p>
        <list list-type="bullet">
          <list-item>
            <p>RQ1: Which potential (methodological) approaches exist for the classification and tracking of provenance criteria and methods in a biomedical or domain-independent context?</p>
          </list-item>
          <list-item>
            <p>RQ2: How can the potential value of provenance information be harnessed and by whom? How can usability be provided?</p>
          </list-item>
          <list-item>
            <p>RQ3: What are the challenges and potential problems or bottlenecks for the accomplishment of provenance?</p>
          </list-item>
          <list-item>
            <p>RQ4: Which guidelines or demands for the consideration of provenance criteria in a biomedical or domain-independent context have to be followed?</p>
          </list-item>
          <list-item>
            <p>RQ5: How completely can provenance be mapped in the data life cycle or during data management?</p>
          </list-item>
        </list>
      </sec>
      <sec>
        <title>Stage 2: Identifying Relevant Studies</title>
        <p>Concepts and matching keywords were categorized into 4 groups (<xref ref-type="table" rid="table1">Table 1</xref>): <italic>target domain</italic> refers to the context of the research topic and includes studies with a biomedical, health care, clinical, or scientific background. In this work, scientific background is limited to domain-independent studies and excludes all other domain-specific studies. <italic>Provenance</italic> concerns the information about the genesis of a given object. <italic>Provenance properties</italic> cover specific requirements tied to the term <italic>provenance</italic>; they also describe selected characteristics in this context. <italic>Objective</italic> includes the purposes or intention of provenance capture. The comprehensive search strategy is recorded in the study protocol [<xref ref-type="bibr" rid="ref17">17</xref>], and search strings combined with Boolean operators are attached (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Concepts and matching keywords (eligibility criteria).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="270"/>
            <col width="730"/>
            <thead>
              <tr valign="top">
                <td>Concepts</td>
                <td>Matching keywords (inclusion criteria)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Target domain</td>
                <td>biomed*<sup>a</sup>, EHR, electronic health record, health care, clinical, scientific<sup>b</sup></td>
              </tr>
              <tr valign="top">
                <td>Provenance</td>
                <td>provenance, prov, lineage</td>
              </tr>
              <tr valign="top">
                <td>Provenance properties</td>
                <td>interop*, (data NEAR/2 [flow, quality, transformation]), metadata, workflow, semantic, framework, annotat*, ontolog*, management, document*, (model NEAR/2 provenance)</td>
              </tr>
              <tr valign="top">
                <td>Objective</td>
                <td>audit*, decision support, ETL, Extract-Transform-Load, FHIR, record linking, machine learning, reproducib*, transparen*, track*, implement*</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>The * symbol (wildcard character) replaces or represents one or more characters.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>Will be used in a domain-independent context only.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Stage 3: Study Selection</title>
        <p>The PRISMA (Preferred Reporting Items for Systematic Reviews and Meta-Analyses) flowchart depicts the selection process. First, we identified all relevant studies in the PubMed and Web of Science databases based on our search strategy. After deduplication, we launched a transparent screening process by importing all relevant studies into Rayyan [<xref ref-type="bibr" rid="ref19">19</xref>], a systematic review supporting solution. The studies were then reviewed by at least 2 independent researchers. In the case of vote agreement, the study was either included in the next review phase or excluded from the review. A third independent reviewer was consulted to solve the conflict if no consensus could be reached. The study screening phase started with a title and abstract evaluation for eligibility. Included studies were submitted to a full-text screening, while performing a thorough investigation on the study report. Reviewers voted for inclusion or exclusion considering the inclusion and exclusion criteria. Finally, the residing set of qualified studies was moved into the data extraction pipeline. A description of the study selection is provided in the protocol [<xref ref-type="bibr" rid="ref17">17</xref>].</p>
        <p>Studies were included if they (1) were focused on the biomedical domain or were domain independent, (2) described provenance-tracking approaches, and (3) were written in English. Studies were excluded if they (1) were not specific to the biomedical or general domain, (2) were gray literature, and (3) did not focus on provenance-tracking approaches.</p>
      </sec>
      <sec>
        <title>Stage 4: Charting the Data</title>
        <p>We followed a collaborative and iterative process to define a charting table for data extraction. Individual reviewers (KG, FK, FH, SG, AAZ, and DW) then scrutinized all studies and extracted central textual occurrences into the data extraction sheet. The variables in the data extraction sheet correspond with the RQs. General characteristics of the studies, approaches for classification and tracking of provenance, and their associated challenges along with the significance and completeness of provenance information in the given context were part of the investigational charting. The reviewers independently charted the data in a structured and consistent way and discussed the results.</p>
      </sec>
      <sec>
        <title>Stage 5: Collating, Summarizing, and Reporting the Results</title>
        <p>The extracted data were analyzed using summary statistics by calculating the total number and percentages of all studies per category, if applicable. Charts were presented for the distribution of the individual data elements where applicable. The data analysis was partially supported with scripts in Python (version 3.10.0) [<xref ref-type="bibr" rid="ref20">20</xref>]. Plots were generated with R version 4.0.4 (R Core Team) [<xref ref-type="bibr" rid="ref21">21</xref>] and version 1.3.0 of the <italic>tidyverse</italic> package [<xref ref-type="bibr" rid="ref22">22</xref>].</p>
        <p>Further analysis was performed using qualitative evaluation. The reporting of the results and outcomes was structured according to the RQs. On the basis of the analysis of the review results, we have developed a road map for a customized provenance framework that considers the life cycle of the software framework (Provenance-Software Framework Life Cycle [SFL]). Implications for future research, practice, and policy makers were outlined. Our reporting adheres to the PRISMA-ScR (Preferred Reporting Items for Systematic Reviews and Meta-Analyses Extension for Scoping Reviews) reporting guidelines [<xref ref-type="bibr" rid="ref23">23</xref>].</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Literature Search</title>
        <p>The search in the PubMed and Web of Science databases resulted in 764 hits and included papers from January 1, 2006, to December 31, 2022. Afterward, 140 duplicates were removed. The remaining 624 papers were subjected to title-abstract screening in an interactive selection process, leaving 118 eligible papers for the full-text review. The full-text papers were further screened to identify papers eligible for the subsequent step of data charting. During this step, additional 52 papers were excluded (see the Stage 4: Charting the Data section). These papers either did not meet the study design context (31/52, 60%) or they lacked the domain concept (15/52, 29%). Four papers reported the same study or contained parts of it, and 2 were not a full paper. A total of 66 articles were included in the data extraction phase (<xref ref-type="table" rid="table2">Table 2</xref>). The paper selection followed the PRISMA [<xref ref-type="bibr" rid="ref24">24</xref>] approach (<xref rid="figure1" ref-type="fig">Figure 1</xref>), and the PRISMA-ScR checklist is presented in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>List of included papers.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="110"/>
            <col width="660"/>
            <col width="230"/>
            <thead>
              <tr valign="top">
                <td>Number</td>
                <td>Title</td>
                <td>Study</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>1</td>
                <td>Clinical Text Mining on FHIR</td>
                <td>Daumke et al [<xref ref-type="bibr" rid="ref25">25</xref>], 2019</td>
              </tr>
              <tr valign="top">
                <td>2</td>
                <td>Provenance Solutions for Medical Research in Heterogeneous IT-Infrastructure: An Implementation Roadmap</td>
                <td>Parciak et al [<xref ref-type="bibr" rid="ref26">26</xref>], 2019</td>
              </tr>
              <tr valign="top">
                <td>3</td>
                <td>BioWorkbench: a high-performance framework for managing and analyzing bioinformatics experiments</td>
                <td>Mondelli et al [<xref ref-type="bibr" rid="ref27">27</xref>], 2018</td>
              </tr>
              <tr valign="top">
                <td>4</td>
                <td>Towards structured sharing of raw and derived neuroimaging data across existing resources</td>
                <td>Keator et al [<xref ref-type="bibr" rid="ref28">28</xref>], 2013</td>
              </tr>
              <tr valign="top">
                <td>5</td>
                <td>A unified framework for managing provenance information in translational research</td>
                <td>Sahoo et al [<xref ref-type="bibr" rid="ref13">13</xref>], 2011</td>
              </tr>
              <tr valign="top">
                <td>6</td>
                <td>Towards FAIR protocols and workflows: the OpenPREDICT use case</td>
                <td>Celebi et al [<xref ref-type="bibr" rid="ref29">29</xref>], 2020</td>
              </tr>
              <tr valign="top">
                <td>7</td>
                <td>A Survey on Collecting, Managing, and Analyzing Provenance from Scripts</td>
                <td>Pimentel et al [<xref ref-type="bibr" rid="ref30">30</xref>], 2019</td>
              </tr>
              <tr valign="top">
                <td>8</td>
                <td>Reproducibility Analysis of Scientific Workflows</td>
                <td>Bánáti et al [<xref ref-type="bibr" rid="ref31">31</xref>], 2017</td>
              </tr>
              <tr valign="top">
                <td>9</td>
                <td>Implementing interoperable provenance in biomedical research</td>
                <td>Curcin et al [<xref ref-type="bibr" rid="ref1">1</xref>], 2014</td>
              </tr>
              <tr valign="top">
                <td>10</td>
                <td>Why linked data is not enough for scientists</td>
                <td>Bechhofer et al [<xref ref-type="bibr" rid="ref32">32</xref>], 2013</td>
              </tr>
              <tr valign="top">
                <td>11</td>
                <td>Representing distributed systems using the Open Provenance Model</td>
                <td>Groth and Moreau [<xref ref-type="bibr" rid="ref33">33</xref>], 2011</td>
              </tr>
              <tr valign="top">
                <td>12</td>
                <td>A Semantic Web approach to the provenance challenge</td>
                <td>Golbeck and Hendler [<xref ref-type="bibr" rid="ref34">34</xref>], 2008</td>
              </tr>
              <tr valign="top">
                <td>13</td>
                <td>Applying content management to automated provenance capture</td>
                <td>Schuchardt et al [<xref ref-type="bibr" rid="ref35">35</xref>], 2008</td>
              </tr>
              <tr valign="top">
                <td>14</td>
                <td>The Generalized Data Model for clinical research</td>
                <td>Danese et al [<xref ref-type="bibr" rid="ref36">36</xref>], 2019</td>
              </tr>
              <tr valign="top">
                <td>15</td>
                <td>FHIR Healthcare Directories: Adopting Shared Interfaces to Achieve Interoperable Medical Device Data Integration</td>
                <td>Tyndall and Tyndall [<xref ref-type="bibr" rid="ref37">37</xref>], 2018</td>
              </tr>
              <tr valign="top">
                <td>16</td>
                <td>ProvCaRe: Characterizing Scientific Reproducibility of Biomedical Research Studies using Semantic Provenance Metadata</td>
                <td>Sahoo et al [<xref ref-type="bibr" rid="ref38">38</xref>], 2019</td>
              </tr>
              <tr valign="top">
                <td>17</td>
                <td>Embedding data provenance into the Learning Health System to facilitate reproducible research</td>
                <td>Curcin [<xref ref-type="bibr" rid="ref4">4</xref>], 2017</td>
              </tr>
              <tr valign="top">
                <td>18</td>
                <td>Application of Data Provenance in Healthcare Analytics Software Information Visualisation of User Activities</td>
                <td>Xu et al [<xref ref-type="bibr" rid="ref39">39</xref>], 2018</td>
              </tr>
              <tr valign="top">
                <td>19</td>
                <td>AiiDA 1.0, a scalable computational infrastructure for automated reproducible workflows and data provenance</td>
                <td>Huber et al [<xref ref-type="bibr" rid="ref40">40</xref>], 2020</td>
              </tr>
              <tr valign="top">
                <td>20</td>
                <td>Provenance for distributed biomedical workflow execution</td>
                <td>Madougou et al [<xref ref-type="bibr" rid="ref41">41</xref>], 2012</td>
              </tr>
              <tr valign="top">
                <td>21</td>
                <td>Capturing and Analyzing Provenance from Spark-based Scientific Workflows with SAMbA-RaP</td>
                <td>Guedes et al [<xref ref-type="bibr" rid="ref42">42</xref>], 2020</td>
              </tr>
              <tr valign="top">
                <td>22</td>
                <td>Why-Diff: Exploiting Provenance to Understand Outcome Differences From Non-Identical Reproduced Workflows</td>
                <td>Thavasimani et al [<xref ref-type="bibr" rid="ref43">43</xref>], 2019</td>
              </tr>
              <tr valign="top">
                <td>23</td>
                <td>Deriving scientific workflows from algebraic experiment lines: A practical approach</td>
                <td>Marinho et al [<xref ref-type="bibr" rid="ref44">44</xref>], 2017</td>
              </tr>
              <tr valign="top">
                <td>24</td>
                <td>Access control and view generation for provenance graphs</td>
                <td>Danger et al [<xref ref-type="bibr" rid="ref45">45</xref>], 2015</td>
              </tr>
              <tr valign="top">
                <td>25</td>
                <td>Provenance-based reproducibility in the Semantic Web</td>
                <td>Moreau [<xref ref-type="bibr" rid="ref46">46</xref>], 2011</td>
              </tr>
              <tr valign="top">
                <td>26</td>
                <td>PASSing the Provenance challenge</td>
                <td>Holland et al [<xref ref-type="bibr" rid="ref47">47</xref>], 2008</td>
              </tr>
              <tr valign="top">
                <td>27</td>
                <td>Decentralised provenance for healthcare data</td>
                <td>Margheri et al [<xref ref-type="bibr" rid="ref48">48</xref>], 2020</td>
              </tr>
              <tr valign="top">
                <td>28</td>
                <td>Enhancing Traceability in Clinical Research Data through a Metadata Framework.</td>
                <td>Hume et al [<xref ref-type="bibr" rid="ref12">12</xref>], 2020</td>
              </tr>
              <tr valign="top">
                <td>29</td>
                <td>Scientific Reproducibility in Biomedical Research: Provenance Metadata Ontology for Semantic Annotation of Study Description</td>
                <td>Sahoo et al [<xref ref-type="bibr" rid="ref49">49</xref>], 2016</td>
              </tr>
              <tr valign="top">
                <td>30</td>
                <td>Managing and exploiting routinely collected NHS data for research</td>
                <td>Curcin et al [<xref ref-type="bibr" rid="ref50">50</xref>], 2013</td>
              </tr>
              <tr valign="top">
                <td>31</td>
                <td>The eGenVar data management system—cataloguing and sharing sensitive data and metadata for the life sciences</td>
                <td>Razick et al [<xref ref-type="bibr" rid="ref51">51</xref>], 2014</td>
              </tr>
              <tr valign="top">
                <td>32</td>
                <td>BioQ: tracing experimental origins in public genomic databases using a novel data provenance model</td>
                <td>Saccone et al [<xref ref-type="bibr" rid="ref52">52</xref>], 2012</td>
              </tr>
              <tr valign="top">
                <td>33</td>
                <td>Applications of provenance in performance prediction and data storage optimisation</td>
                <td>Woodman et al [<xref ref-type="bibr" rid="ref53">53</xref>], 2017</td>
              </tr>
              <tr valign="top">
                <td>34</td>
                <td>ProvManager: a provenance management system for scientific workflows</td>
                <td>Marinho et al [<xref ref-type="bibr" rid="ref54">54</xref>], 2012</td>
              </tr>
              <tr valign="top">
                <td>35</td>
                <td>Provenance in collection-oriented scientific workflows</td>
                <td>Bowers et al [<xref ref-type="bibr" rid="ref55">55</xref>], 2008</td>
              </tr>
              <tr valign="top">
                <td>36</td>
                <td>A novel approach to provenance management for privacy preservation</td>
                <td>Can and Yilmazer [<xref ref-type="bibr" rid="ref56">56</xref>], 2020</td>
              </tr>
              <tr valign="top">
                <td>37</td>
                <td>Templates as a method for implementing data provenance in decision support systems</td>
                <td>Curcin et al [<xref ref-type="bibr" rid="ref57">57</xref>], 2017</td>
              </tr>
              <tr valign="top">
                <td>38</td>
                <td>Sharing interoperable workflow provenance: A review of best practices and their practical application in CWLProv</td>
                <td>Khan et al [<xref ref-type="bibr" rid="ref58">58</xref>], 2019</td>
              </tr>
              <tr valign="top">
                <td>39</td>
                <td>PAV ontology: provenance, authoring and versioning</td>
                <td>Ciccarese et al [<xref ref-type="bibr" rid="ref59">59</xref>], 2013</td>
              </tr>
              <tr valign="top">
                <td>40</td>
                <td>Enabling precision medicine via standard communication of HTS provenance, analysis, and results</td>
                <td>Alterovitz et al [<xref ref-type="bibr" rid="ref60">60</xref>], 2018</td>
              </tr>
              <tr valign="top">
                <td>41</td>
                <td>NeuroProv: Provenance data visualisation for neuroimaging analyses</td>
                <td>Arshad et al [<xref ref-type="bibr" rid="ref61">61</xref>], 2019</td>
              </tr>
              <tr valign="top">
                <td>42</td>
                <td>AVOCADO: Visualization of Workflow-Derived Data Provenance for Reproducible Biomedical Research</td>
                <td>Stitz et al [<xref ref-type="bibr" rid="ref62">62</xref>], 2016</td>
              </tr>
              <tr valign="top">
                <td>43</td>
                <td>Provenance Context Entity (PaCE): Scalable Provenance Tracking for Scientific RDF Data</td>
                <td>Sahoo et al [<xref ref-type="bibr" rid="ref63">63</xref>], 2010</td>
              </tr>
              <tr valign="top">
                <td>44</td>
                <td>A semantic proteomics dashboard (SemPoD) for data management in translational research</td>
                <td>Jayapandian et al [<xref ref-type="bibr" rid="ref2">2</xref>], 2012</td>
              </tr>
              <tr valign="top">
                <td>45</td>
                <td>Providing traceability for neuroimaging analyses</td>
                <td>McClatchey et al [<xref ref-type="bibr" rid="ref64">64</xref>], 2013</td>
              </tr>
              <tr valign="top">
                <td>46</td>
                <td>PGxO and PGxLOD: a reconciliation of pharmacogenomic knowledge of various provenances, enabling further comparison</td>
                <td>Monnin et al [<xref ref-type="bibr" rid="ref65">65</xref>], 2019</td>
              </tr>
              <tr valign="top">
                <td>47</td>
                <td>Provenance data discovery through Semantic Web resources</td>
                <td>Ornelas et al [<xref ref-type="bibr" rid="ref66">66</xref>], 2018</td>
              </tr>
              <tr valign="top">
                <td>48</td>
                <td>Characterizing workflow-based activity on a production e-infrastructure using provenance data</td>
                <td>Madougou et al [<xref ref-type="bibr" rid="ref67">67</xref>], 2013</td>
              </tr>
              <tr valign="top">
                <td>49</td>
                <td>Storing, reasoning, and querying OPM-compliant scientific workflow provenance using relational databases</td>
                <td>Lim et al [<xref ref-type="bibr" rid="ref68">68</xref>], 2011</td>
              </tr>
              <tr valign="top">
                <td>50</td>
                <td>Blockchain for Healthcare: Securing Patient Data and Enabling Trusted Artiﬁcial Intelligence</td>
                <td>Jennath et al [<xref ref-type="bibr" rid="ref69">69</xref>], 2020</td>
              </tr>
              <tr valign="top">
                <td>51</td>
                <td>Bio-Swarm-Pipeline: a light-weight, extensible batch processing system for efficient biomedical data processing</td>
                <td>Cheng et al [<xref ref-type="bibr" rid="ref70">70</xref>], 2009</td>
              </tr>
              <tr valign="top">
                <td>52</td>
                <td>A Comprehensive Query Language for Provenance Information</td>
                <td>Jabal and Bertino [<xref ref-type="bibr" rid="ref71">71</xref>], 2018</td>
              </tr>
              <tr valign="top">
                <td>53</td>
                <td>Provenance trails in the Wings/Pegasus system</td>
                <td>Kim et al [<xref ref-type="bibr" rid="ref72">72</xref>], 2008</td>
              </tr>
              <tr valign="top">
                <td>54</td>
                <td>OPQL: Querying scientific workflow provenance at the graph level</td>
                <td>Lim et al [<xref ref-type="bibr" rid="ref73">73</xref>], 2013</td>
              </tr>
              <tr valign="top">
                <td>55</td>
                <td>Lightweight Distributed Provenance Model for Complex Real-world Environments</td>
                <td>Wittner et al [<xref ref-type="bibr" rid="ref74">74</xref>], 2022</td>
              </tr>
              <tr valign="top">
                <td>56</td>
                <td>A collaborative semantic-based provenance management platform for reproducibility</td>
                <td>Samuel and Konig-Ries [<xref ref-type="bibr" rid="ref75">75</xref>], 2022</td>
              </tr>
              <tr valign="top">
                <td>57</td>
                <td>A novel visualization approach for data provenance</td>
                <td>Yazici et al [<xref ref-type="bibr" rid="ref76">76</xref>], 2022</td>
              </tr>
              <tr valign="top">
                <td>58</td>
                <td>Trellis for efficient data and task management in the VA Million Veteran Program</td>
                <td>Ross et al [<xref ref-type="bibr" rid="ref77">77</xref>], 2021</td>
              </tr>
              <tr valign="top">
                <td>59</td>
                <td>ECO: the Evidence and Conclusion Ontology, an update for 2022</td>
                <td>Nadendla et al [<xref ref-type="bibr" rid="ref78">78</xref>], 2022</td>
              </tr>
              <tr valign="top">
                <td>60</td>
                <td>RepeatFS: a file system providing reproducibility through provenance and automation.</td>
                <td>Westbrook et al [<xref ref-type="bibr" rid="ref79">79</xref>], 2021</td>
              </tr>
              <tr valign="top">
                <td>61</td>
                <td>The BMS-LM ontology for biomedical data reporting throughout the life cycle of a research study: From data model to ontology</td>
                <td>Raboudi et al [<xref ref-type="bibr" rid="ref80">80</xref>], 2022</td>
              </tr>
              <tr valign="top">
                <td>62</td>
                <td>FAIRSCAPE: a Framework for FAIR and Reproducible Biomedical Analytics</td>
                <td>Levinson et al [<xref ref-type="bibr" rid="ref81">81</xref>], 2021</td>
              </tr>
              <tr valign="top">
                <td>63</td>
                <td>FAIRly big: A framework for computationally reproducible processing of large-scale data</td>
                <td>Wagner et al [<xref ref-type="bibr" rid="ref82">82</xref>], 2022</td>
              </tr>
              <tr valign="top">
                <td>64</td>
                <td>FAIR data pipeline: provenance-driven data management for traceable scientific workflows</td>
                <td>Mitchell et al [<xref ref-type="bibr" rid="ref83">83</xref>], 2022</td>
              </tr>
              <tr valign="top">
                <td>65</td>
                <td>Enabling Scientific Reproducibility through FAIR Data Management: An ontology-driven deep learning approach in the NeuroBridge Project</td>
                <td>Wang et al [<xref ref-type="bibr" rid="ref84">84</xref>], 2022</td>
              </tr>
              <tr valign="top">
                <td>66</td>
                <td>The Neuroscience Experiments System (NES)-A Software Tool to Manage Experimental Data and Its Provenance</td>
                <td>Ruiz-Olazar et al [<xref ref-type="bibr" rid="ref85">85</xref>], 2021</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>PRISMA (Preferred Reporting Items for Systematic Reviews and Meta-Analyses) flow diagram displaying the paper selection process with the number of studies in the identification and screening phases and all included studies in the scoping review.</p>
          </caption>
          <graphic xlink:href="jmir_v26i1e51297_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Characteristics of the Included Studies</title>
        <p>All papers (n=66) were first published between 2006 and 2022 (<xref ref-type="table" rid="table2">Table 2</xref>). More than half of the reviewed studies were published within the past 5 years, which we selected for our scoping review. Predominantly, studies originated from the biomedical or health care domain (45/66, 68%), followed by the domain-independent studies (21/66, 32%). Document characteristics of the study corpus are provided in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>.</p>
        <p>All studies in this review were screened with regard to the 5 RQs described in the Methods section. The following subsections describe our findings for RQ1 to RQ5.</p>
      </sec>
      <sec>
        <title>RQ1: Classification and Tracking of Provenance Criteria in Biomedical Workflows and Data</title>
        <sec>
          <title>RQ1.1: Characteristics of Provenance Framework Types</title>
          <p>Heterogeneous approaches for classifying and tracking provenance criteria have been reported in the selected literature (n=66). We propose to categorize them by their focus (<xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>). Most articles (58/66, 88%) focused explicitly on practical provenance management approaches. The remaining theoretical frameworks (8/66, 12%) provided recommendations or reviews. They can be classified into the following subcategories.</p>
        </sec>
        <sec>
          <title>Semantics and Models, Ontologies, and Metadata (27/58, 47%)</title>
          <p>This comprises provenance-tracking approaches on different granularity, ontology, and model abstraction levels. The semantic Provenance Context Entity approach [<xref ref-type="bibr" rid="ref63">63</xref>] was developed to track provenance in Resource Description Framework–based semantic web applications. An example of an annotation mechanism was introduced with collection-oriented modeling and design [<xref ref-type="bibr" rid="ref55">55</xref>]. The Provenance Metadata Model (ProvCaRe S3), supporting scientific reproducibility, was represented with the Web Ontology Language and provenance triples served as a basis for the provenance graph [<xref ref-type="bibr" rid="ref38">38</xref>]. Later, the NeuroBridge ontology extended ProvCaRe, combined with a deep learning model [<xref ref-type="bibr" rid="ref84">84</xref>]. Further ontologies include the REPRODUCE-ME ontology, integrated in the CAESAR project [<xref ref-type="bibr" rid="ref75">75</xref>], or the BioMedical Study–Lifecycle Management core ontology [<xref ref-type="bibr" rid="ref80">80</xref>]. application programming interfaces for visualization [<xref ref-type="bibr" rid="ref71">71</xref>] or querying purposes [<xref ref-type="bibr" rid="ref28">28</xref>] and web services for user access to provenance data [<xref ref-type="bibr" rid="ref2">2</xref>] were reported.</p>
        </sec>
        <sec>
          <title>Scientific Workflows and Workflow Executions (18/58, 31%)</title>
          <p>These are mainly Open Provenance Model (OPM)–oriented workflows [<xref ref-type="bibr" rid="ref86">86</xref>] on different semantic levels, like in the BioWorkbench [<xref ref-type="bibr" rid="ref27">27</xref>], OpenPREDICT [<xref ref-type="bibr" rid="ref29">29</xref>], or Web Ontology Language projects. Provenance data were stored in relational databases, like in OPMProv [<xref ref-type="bibr" rid="ref73">73</xref>] or in graph databases [<xref ref-type="bibr" rid="ref53">53</xref>,<xref ref-type="bibr" rid="ref77">77</xref>]. Querying possibilities were offered via a web service or with specific querying languages at the graph level [<xref ref-type="bibr" rid="ref73">73</xref>].</p>
        </sec>
        <sec>
          <title>Privacy Aspects (5/58, 9%)</title>
          <p>Decentralized management and General Data Protection Regulation requirements led to the use of blockchain technologies [<xref ref-type="bibr" rid="ref48">48</xref>] in combination with the PROV model standard. Another scenario incorporated blockchain in a proof-of-concept study [<xref ref-type="bibr" rid="ref69">69</xref>] to enable an audit trail mechanism for a trusted artificial intelligence model.</p>
        </sec>
        <sec>
          <title>Visualization Aspect (4/58, 7%)</title>
          <p>The complexity of representing provenance information at different levels of aggregation was examined in the AVOCADO project [<xref ref-type="bibr" rid="ref62">62</xref>]. The NeuroProv project [<xref ref-type="bibr" rid="ref61">61</xref>] shows how visualization supports clinicians in information tracking and reproducibility analysis.</p>
        </sec>
        <sec>
          <title>General Data Managing Tools (4/58, 7%)</title>
          <p>Frameworks provide different modules for data and workflow provenance capture, representation, storage, comparison, and visualization [<xref ref-type="bibr" rid="ref75">75</xref>] or automatic recomputation of arbitrary data-processing results [<xref ref-type="bibr" rid="ref82">82</xref>].</p>
        </sec>
        <sec>
          <title>RQ1.2: Provenance Model Characteristics</title>
          <p>At all, 58 papers reported about provenance model characteristics. The dominant provenance models refer to the PROV [<xref ref-type="bibr" rid="ref8">8</xref>] specification (25/58, 43%), established by the World Wide Web Consortium (W3C) as the de facto standard for provenance modeling, and the frequently used OPM [<xref ref-type="bibr" rid="ref86">86</xref>] (17/58, 29%; <xref ref-type="supplementary-material" rid="app5">Multimedia Appendix 5</xref>). Other models cite specific solutions (11/58, 19%), are concerned with metadata provision (5/58, 9%), or do not provide any information on the provenance model (8/58, 14%).</p>
          <p>OPM is the result of 3 provenance challenges (since 2011 until today). OPM (version 1.1) is exchangeable across systems and supports a process-oriented and dataflow-oriented view. It is based on the notion of the annotated causality graph with nodes as artifacts, processes, and agents. OPM was further developed into a provenance data model. PROV [<xref ref-type="bibr" rid="ref8">8</xref>] comprises a family of specifications for provenance, designed to promote the publication of provenance information on the web. It offers interoperability across systems and is quite generic.</p>
          <p><xref rid="figure2" ref-type="fig">Figure 2</xref> displays the temporal evolution of the characterized frameworks depending on the applied models. We observed an increased number of papers relating to these provenance management frameworks between 2016 and 2022. At this time, the OPM and W3C PROV standards were extended. The onset of the FAIR principles [<xref ref-type="bibr" rid="ref29">29</xref>] and the Fast Healthcare Interoperability Resources framework [<xref ref-type="bibr" rid="ref40">40</xref>] furthermore set new requirements for modeling and implementation projects.</p>
          <fig id="figure2" position="float">
            <label>Figure 2</label>
            <caption>
              <p>Reported provenance management frameworks per year. The size of the ring corresponds with the number of articles per year that discuss a specific model (color-coded) in the context of the respective framework. OPM: Open Provenance Model; W3C: World Wide Web Consortium.</p>
            </caption>
            <graphic xlink:href="jmir_v26i1e51297_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>RQ1.3: Validation Status</title>
          <p>Most of the studies (n=52) report a successful validation of their provenance solution. The use cases were mostly domain-specific (eg, as part of the AVOCADO [<xref ref-type="bibr" rid="ref62">62</xref>] project). Other authors chose classical semantic evaluation schemes that demonstrated feasibility by responding to competency questions. Examples are the provenance challenges or proof-of-concept frameworks [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref56">56</xref>,<xref ref-type="bibr" rid="ref69">69</xref>,<xref ref-type="bibr" rid="ref72">72</xref>].</p>
          <p>To pass the provenance challenges, participants needed to solve predefined provenance queries [<xref ref-type="bibr" rid="ref47">47</xref>,<xref ref-type="bibr" rid="ref55">55</xref>,<xref ref-type="bibr" rid="ref73">73</xref>]. Can and Yilmazer [<xref ref-type="bibr" rid="ref56">56</xref>] evaluated their domain-independent model with an infectious disease use case and implementing the Healthcare Provenance Information System. Sometimes, more than one approach had been taken for evaluation (eg, use cases and factors, ontology validation, and a user-based study were applied to evaluate the CAESAR approach for scientific experiments [<xref ref-type="bibr" rid="ref75">75</xref>]). A prototype visualization tool for provenance information used satisfaction surveys to assess the usability of the system [<xref ref-type="bibr" rid="ref76">76</xref>].</p>
          <p>Curcin et al [<xref ref-type="bibr" rid="ref57">57</xref>] emphasized that the setup of provenance data needs to be modeled and verified separately from the software implementation. Precise validation methods for provenance services focus on usability, performance, scalability, fault tolerance, and functionality [<xref ref-type="bibr" rid="ref64">64</xref>]. Moreover, they demanded more formal engineering techniques to foster provenance implementation across a broad range of software tools in the biomedical domain and beyond [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref74">74</xref>]. In that sense, formal validation as part of the software engineering process contributes to increased software quality, and formal validation requires testing efforts and testing evidence. However, accurate alignment of testing procedures against predefined requirements in the software life cycle could not be identified.</p>
        </sec>
        <sec>
          <title>RQ1.4: Provenance Characteristics</title>
          <p>The term <italic>provenance</italic> is subjected to an evolutionary and technical process with multifaceted meanings and roles in the selected papers (n=66). There is agreement that provenance is a piece of history. However, the focus of provenance work ranges from abstract workflow descriptions to summaries of workflow executions to more general knowledge about data sources and result dependencies [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref51">51</xref>,<xref ref-type="bibr" rid="ref65">65</xref>,<xref ref-type="bibr" rid="ref72">72</xref>,<xref ref-type="bibr" rid="ref73">73</xref>]. For example, provenance as semantic metadata was specified in several works between 2007 and 2019. Monnin et al [<xref ref-type="bibr" rid="ref65">65</xref>] required the encoding of provenance of pharmacogenomics knowledge units. Other works refer to data provenance as knowledge about data sources [<xref ref-type="bibr" rid="ref45">45</xref>] or as a piece of analytic software [<xref ref-type="bibr" rid="ref39">39</xref>], as machine-interpretable provenance of data sets, as software and computations, as metadata for all computed results [<xref ref-type="bibr" rid="ref81">81</xref>], or as the description of the data and its original context, and tracing data history from their creation to their sharing [<xref ref-type="bibr" rid="ref80">80</xref>].</p>
          <p>Sahoo et al [<xref ref-type="bibr" rid="ref38">38</xref>] stated that the provenance data model together with the PROV Ontology define the minimal categories of provenance metadata terms. Other studies discussed the combined provenance of data and workflows and introduce the terms <italic>prospective</italic>, <italic>retrospective</italic>, and <italic>domain provenance</italic> [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref59">59</xref>]. While prospective provenance expresses future abstract workflow information, retrospective provenance gathers past workflow execution and data derivation information. Domain-specific provenance can be defined as an extension to the PROV Ontology. Workflow provenance has repeatedly been mentioned in the context of workflow execution [<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref34">34</xref>]. Wittner et al [<xref ref-type="bibr" rid="ref74">74</xref>] introduced the term <italic>provenance backbone</italic>, which covers coarse granularity representation of traceable object artifacts, whereas Mitchell et al [<xref ref-type="bibr" rid="ref83">83</xref>] expressed provenance in relation to intrinsic and extrinsic metadata. The “FAIRly big framework” [<xref ref-type="bibr" rid="ref82">82</xref>] demonstrates how records of process provenance are captured and stored in a machine-readable, automatically re-executable way. The 7 Ws (who, what, where, why, when, which, and how) characterize provenance in the study by Ruiz-Olazar et al [<xref ref-type="bibr" rid="ref85">85</xref>].</p>
        </sec>
        <sec>
          <title>RQ1.5: Requirements for Provenance Frameworks</title>
          <p>Out of 66 reviewed papers, 44 (67%) papers mentioned ≥1 functional and nonfunctional requirements for the referenced framework type. However, 33% (22/66) of the papers did not identify any specific requirements. For those studies that did, we identified 9 different word fields, matched them (<xref rid="figure3" ref-type="fig">Figure 3</xref>), and explained the citations (<xref ref-type="supplementary-material" rid="app6">Multimedia Appendix 6</xref>).</p>
          <p>Intensive interdisciplinary work on requirements analysis has been undertaken [<xref ref-type="bibr" rid="ref75">75</xref>,<xref ref-type="bibr" rid="ref83">83</xref>]. As such, a workshop with scientists from multiple disciplines (biology, computer science, ecology, and chemistry) and an exploratory study [<xref ref-type="bibr" rid="ref75">75</xref>] contribute to requirements collection in the epidemiological field [<xref ref-type="bibr" rid="ref83">83</xref>]. Another way to identify requirements is based on exhaustive literature research and interviews with domain specialists [<xref ref-type="bibr" rid="ref85">85</xref>]. <xref rid="figure3" ref-type="fig">Figure 3</xref> visualizes the reported provenance requirements. The most popular requirements refer to the word fields integrity (16/44, 36%) and reproducibility (13/44, 30%), followed by interoperability, traceability, and performance or scalability related topics (each 9/44, 20%). Others were related to the word fields organizational and security (each 8/44, 18%). Only a few studies reported on trust (5/44, 11%) and usability (3/44, 7%) linked approaches.</p>
          <fig id="figure3" position="float">
            <label>Figure 3</label>
            <caption>
              <p>Reported provenance requirements or factors by word fields. The line thickness in the first level proportionally reflects the respective characteristics count. The second level displays all occurred requirement classes.</p>
            </caption>
            <graphic xlink:href="jmir_v26i1e51297_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>RQ1.6: Domain-Specific Conditions Including Guidelines</title>
          <p>Some papers reported domain-specific standards for provenance (n=17). Beyond the W3C standards, we identified the Open Archival Information System Functional Model as a basis for the development of a research object concept [<xref ref-type="bibr" rid="ref32">32</xref>]. Another example is the International Organization for Standardization (ISO) 15489-1, which defines the term <italic>metadata</italic> [<xref ref-type="bibr" rid="ref51">51</xref>] or the Technical Committee 276 “Biotechnology” ISO, which standardizes provenance information for the biotechnology domain [<xref ref-type="bibr" rid="ref74">74</xref>]. The National Institutes of Health guideline “Rigor and Reproducibility” [<xref ref-type="bibr" rid="ref49">49</xref>] addresses topics impeding the study replicability. The FAIR principles explicitly guided data management practices in studies [<xref ref-type="bibr" rid="ref77">77</xref>,<xref ref-type="bibr" rid="ref83">83</xref>]. The FAIRSCAPE framework presented standards and interoperability such as JSON-LD, W3C PROV or CAT, DOI, and EVI’s formal model as extension to W3C as evidence chains that support or challenge a result [<xref ref-type="bibr" rid="ref81">81</xref>].</p>
        </sec>
      </sec>
      <sec>
        <title>RQ2: Potential Value of Provenance Information</title>
        <sec>
          <title>RQ2.1: Impact of Provenance Information</title>
          <p>In our review, a total of 42 papers reported about various impacts (n=99) on different stakeholders (<xref ref-type="supplementary-material" rid="app7">Multimedia Appendix 7</xref>). The availability of provenance data impacts the scientific and biomedical communities (<xref rid="figure4" ref-type="fig">Figure 4</xref>). With regard to the work of researchers, scientists, academia, investigators, and clinicians (n=64), most papers reported guidance benefits (19/64, 30%) and reproducibility-related effects (12/64, 19%). Considerably fewer papers observed validity (4/64, 6%), managing influence (4/64, 6%), reusability (5/64, 8%) and confidence effects (6/64, 9%). Other studies reported that provenance information impacts the willingness to share knowledge (6/64, 9%), for example, by providing a unified repository for the experimental data for the research group [<xref ref-type="bibr" rid="ref82">82</xref>,<xref ref-type="bibr" rid="ref85">85</xref>]. Interestingly, only 13% (8/64) of the studies discussed implications on the quality of research (eg, [<xref ref-type="bibr" rid="ref46">46</xref>,<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref52">52</xref>,<xref ref-type="bibr" rid="ref72">72</xref>,<xref ref-type="bibr" rid="ref77">77</xref>,<xref ref-type="bibr" rid="ref78">78</xref>,<xref ref-type="bibr" rid="ref84">84</xref>]).</p>
          <p>Other involved team or staff members (n=22) such as developers, data managers, or domain experts were also affected by the availability of provenance information. The majority recognizes benefits in validity (5/22, 23%) [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref60">60</xref>,<xref ref-type="bibr" rid="ref61">61</xref>] and managing benefits (8/22, 36%) [<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref56">56</xref>,<xref ref-type="bibr" rid="ref71">71</xref>,<xref ref-type="bibr" rid="ref76">76</xref>,<xref ref-type="bibr" rid="ref80">80</xref>,<xref ref-type="bibr" rid="ref83">83</xref>] followed by guidance benefits (5/22, 23%) [<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref53">53</xref>,<xref ref-type="bibr" rid="ref60">60</xref>,<xref ref-type="bibr" rid="ref67">67</xref>,<xref ref-type="bibr" rid="ref83">83</xref>]. In addition, reproducibility (3/22, 14%) [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref60">60</xref>,<xref ref-type="bibr" rid="ref79">79</xref>] and reusability (1/22, 4%) impacts were mentioned.</p>
          <p>Only low impact on patients (n=7) was described, mostly referring to the consent of their data (5/7, 71%) [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref56">56</xref>,<xref ref-type="bibr" rid="ref69">69</xref>] to an improved measurable patient outcome and trust in evidence for clinical recommendations (each 1/7, 14%) [<xref ref-type="bibr" rid="ref57">57</xref>].</p>
          <p>Only a few effects on other third parties (n=6) such as data privacy officers, authorities, government, or industry were reported. Related implications concerned mainly the evidence for data validity or sensitive data-processing solutions [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref56">56</xref>,<xref ref-type="bibr" rid="ref69">69</xref>,<xref ref-type="bibr" rid="ref83">83</xref>].</p>
          <fig id="figure4" position="float">
            <label>Figure 4</label>
            <caption>
              <p>Reported impacts of provenance information. Level 1 presents the stakeholder groups and level 2 presents the impacts on the stakeholders. The line thickness in the second level proportionally reflects the respective counts of the characteristics.</p>
            </caption>
            <graphic xlink:href="jmir_v26i1e51297_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>RQ2.2: Data Sources</title>
          <p>A large number of papers (n=42) reported studies processed different types of data sources to generate provenance information, for example, neurological data [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref84">84</xref>,<xref ref-type="bibr" rid="ref85">85</xref>], with large-scale data from the brain imaging component of the UK Biobank project [<xref ref-type="bibr" rid="ref82">82</xref>], electronic health record data [<xref ref-type="bibr" rid="ref27">27</xref>], study data [<xref ref-type="bibr" rid="ref62">62</xref>], animals data [<xref ref-type="bibr" rid="ref80">80</xref>], pathology data [<xref ref-type="bibr" rid="ref74">74</xref>], omics data [<xref ref-type="bibr" rid="ref52">52</xref>], biomedical or medical data [<xref ref-type="bibr" rid="ref64">64</xref>,<xref ref-type="bibr" rid="ref77">77</xref>,<xref ref-type="bibr" rid="ref78">78</xref>], computational data [<xref ref-type="bibr" rid="ref72">72</xref>], time-series analysis of neonatal intensive care unit data [<xref ref-type="bibr" rid="ref81">81</xref>], and data from hybrid methods [<xref ref-type="bibr" rid="ref69">69</xref>].</p>
        </sec>
      </sec>
      <sec>
        <title>RQ3: Challenges, Problems, and Bottlenecks</title>
        <p>Overall, 47 papers reported 74 distinct challenges impeding the implementation of provenance. We categorized these challenges into organizational and technical groups, provided details (<xref ref-type="supplementary-material" rid="app8">Multimedia Appendix 8</xref>) and presented a temporal overview of the challenges (<xref rid="figure5" ref-type="fig">Figure 5</xref>). In summary, issues are related to data annotation, metadata, and modeling of provenance, as well as performance-related challenges. However, the need for more detailed provenance information; consideration of compliance managing topics (eg, security-related conditions); and adherence to quality and software engineering principles such as exchange, discovery, and interoperability emerged later in the course. Furthermore, usability and scalability questions emerged very early in context with provenance consumption.</p>
        <p>More than three-quarters of the reported challenges are technical (64/74, 86%). Thereof, approximately one-fourth is associated with provenance granularity issues (15/64, 23%). Curcin et al [<xref ref-type="bibr" rid="ref1">1</xref>] pointed out that a granular tracking of relevant human interactions, automated processes, or logging is needed and emphasized the difficulty of choosing a proper level of granularity of provenance and associated with this, the right semantic complexity [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref57">57</xref>]. Beyond that, a balanced trade-off between fast execution and provenance granularity must be found [<xref ref-type="bibr" rid="ref42">42</xref>]. In fact, a fine-granular provenance level impacts the computing and storage resources [<xref ref-type="bibr" rid="ref57">57</xref>,<xref ref-type="bibr" rid="ref58">58</xref>]. Furthermore, managing sensitive data restriction requires the integration of adequate security level granularity into the provenance model [<xref ref-type="bibr" rid="ref56">56</xref>].</p>
        <p>Approximately one-third of the reported challenges (20/64, 31%) either mention the insufficient availability of metadata—which subsequently leads to incomplete provenance models—that claims the terminological heterogeneity in the metadata terms associated with study data sets [<xref ref-type="bibr" rid="ref84">84</xref>] or does not conform to explicit annotation standards [<xref ref-type="bibr" rid="ref82">82</xref>]. An improved availability of provenance metadata and FAIR enrichment of the data was demanded [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref80">80</xref>]. Furthermore, stakeholders should be involved in the semantic enrichment of provenance data [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref51">51</xref>]. However, during this metadata annotation phase, a lack of semiautomated procedures for ontology selection, semantic modeling, or mapping techniques was reported [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref51">51</xref>]. Although the use of existing models is encouraged [<xref ref-type="bibr" rid="ref59">59</xref>], as it improves semantic interoperability [<xref ref-type="bibr" rid="ref29">29</xref>], the reuse of vocabularies to represent provenance information remains an extensive task [<xref ref-type="bibr" rid="ref29">29</xref>]. Cheng et al [<xref ref-type="bibr" rid="ref70">70</xref>] noted that it was necessary to properly integrate domain-specific demands into the provenance model. Ruiz-Olazar et al [<xref ref-type="bibr" rid="ref85">85</xref>] claimed that a unified data model for handling metadata is still missing.</p>
        <p>One-fifth of the studies (14/64, 22%) reported performance problems during the acquisition of provenance data, such as workflow overhead [<xref ref-type="bibr" rid="ref54">54</xref>,<xref ref-type="bibr" rid="ref73">73</xref>] and scalability [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref85">85</xref>] issues. Increasing data volumes hamper the processing of provenance visualization and stream handling [<xref ref-type="bibr" rid="ref76">76</xref>]. One proposal with respect to the cost-intensive visualization was to reduce the size of large provenance graphs [<xref ref-type="bibr" rid="ref39">39</xref>]. Other authors reported challenges with quality [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref52">52</xref>] and usability [<xref ref-type="bibr" rid="ref54">54</xref>,<xref ref-type="bibr" rid="ref64">64</xref>,<xref ref-type="bibr" rid="ref69">69</xref>,<xref ref-type="bibr" rid="ref70">70</xref>,<xref ref-type="bibr" rid="ref73">73</xref>,<xref ref-type="bibr" rid="ref75">75</xref>]. According to the literature, data quality and reuse are lacking due to the deficit in provenance deployment, particularly for observational and administrative studies [<xref ref-type="bibr" rid="ref26">26</xref>]. Furthermore, the lack of information about experimental origins in genomics data and their related systematic quality control assessment reduce the quality of provenance and the level of creditability [<xref ref-type="bibr" rid="ref52">52</xref>]. In particular, the low uptake of high-quality semantic models [<xref ref-type="bibr" rid="ref9">9</xref>] and the unavailability of provenance in general [<xref ref-type="bibr" rid="ref36">36</xref>] cause information loss and data quality issues. A minor concern is the usability because provenance is recognized to be still in infancy [<xref ref-type="bibr" rid="ref73">73</xref>]. The challenge of applying more software engineering techniques (4/64, 6%) [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref67">67</xref>] was reported to facilitate provenance implementation across a broad range of software tools in the biomedical domain and beyond [<xref ref-type="bibr" rid="ref1">1</xref>].</p>
        <p>Significantly fewer organizational challenges (10/74, 13%) [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref56">56</xref>-<xref ref-type="bibr" rid="ref58">58</xref>,<xref ref-type="bibr" rid="ref64">64</xref>,<xref ref-type="bibr" rid="ref69">69</xref>,<xref ref-type="bibr" rid="ref73">73</xref>] were reported, partly attributable to a basic unawareness of provenance benefits and less exchange between stakeholders. Khan et al [<xref ref-type="bibr" rid="ref58">58</xref>] stressed that provenance capture must be established as a standard practice, not as an afterthought. McClatchey et al [<xref ref-type="bibr" rid="ref64">64</xref>] also recommended working toward gaining the stakeholder’s acceptance and confidence in the infrastructure. In the same vein, it is recommended to integrate developers already in the design phase [<xref ref-type="bibr" rid="ref1">1</xref>]. However, financial challenges were reported due to the necessary investments in provenance-enabled tooling and capabilities [<xref ref-type="bibr" rid="ref4">4</xref>]. The upcoming relevance of patient-mediated data handling raised new challenges and requirements, especially with respect to policy and governance topics [<xref ref-type="bibr" rid="ref69">69</xref>] and rigorous validation approaches [<xref ref-type="bibr" rid="ref74">74</xref>].</p>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>Challenges per year of publication. The size of and the numbers in the circles represent the number of articles that reveal a challenge (color-coded). Note that numbers are omitted for single articles per category.</p>
          </caption>
          <graphic xlink:href="jmir_v26i1e51297_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>RQ4: Demands</title>
        <p>Because of the extensive information obtained from RQ1, we extended the RQs to gain more insights into the provenance tracing and classification requirements identified in RQ1.</p>
        <p>Interestingly, most of the 15 papers referred to claims relating to quality aspects.</p>
        <p>For example, a more robust assessment of data quality is required [<xref ref-type="bibr" rid="ref36">36</xref>], and clearer and more consistent policies and policy ontologies are requested to prevent disclosure of sensitive data [<xref ref-type="bibr" rid="ref56">56</xref>] and more trained staff is required [<xref ref-type="bibr" rid="ref50">50</xref>], including data managers, software architects, or semantic web specialists. User-friendly interfaces should help scientists in the provenance querying process [<xref ref-type="bibr" rid="ref54">54</xref>]. Developers should not only recognize technologies but also data model recommendations during the design phase [<xref ref-type="bibr" rid="ref1">1</xref>]. Performance of provenance reasoning needs to be improved [<xref ref-type="bibr" rid="ref68">68</xref>] and the further development of ontologies needs to be automated [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref49">49</xref>]. The term “intelligible machines” rather than “intelligent machines” was suggested to better respect the specific aspects of big data technologies in medical research [<xref ref-type="bibr" rid="ref57">57</xref>]. Integrating the Healthcare Enterprise standards, health care legacy protocols, interoperability, and legacy issues are furthermore mentioned [<xref ref-type="bibr" rid="ref48">48</xref>], and mappings between entities of various provenance models should be completed [<xref ref-type="bibr" rid="ref65">65</xref>]. Future integration into a recognized ISO standard similar to BioCompute was proposed [<xref ref-type="bibr" rid="ref60">60</xref>].</p>
      </sec>
      <sec>
        <title>RQ5: Completeness of Provenance Information</title>
        <p>The literature predominantly reports on a qualitative evaluation of completeness during the data management processes. However, we found one study describing a data management process dealing with metadata for traceability in clinical studies, which delivered complete provenance in this respect [<xref ref-type="bibr" rid="ref12">12</xref>]. Curcin [<xref ref-type="bibr" rid="ref4">4</xref>] proposed to incorporate provenance information in the validation against standards.</p>
        <p>One study applied data from 6 clinical research studies and &#62;100 variables to evaluate the coverage of the provenance ontology in the semantic annotation of the study descriptions [<xref ref-type="bibr" rid="ref49">49</xref>]. Two other documents invoked the need for minimal information elements to ensure sufficient process specification [<xref ref-type="bibr" rid="ref28">28</xref>] and the existence of rich provenance information for reconstructing and rerunning pipelines [<xref ref-type="bibr" rid="ref29">29</xref>].</p>
        <p>A visualization of provenance data in neuroimaging took a semiqualitative approach for measuring the coverage. They mapped the metrics to use cases for the traceability of results and concluded that there is no absolute measure possible to verify the visualization approach [<xref ref-type="bibr" rid="ref61">61</xref>]. Arshad et al [<xref ref-type="bibr" rid="ref61">61</xref>] tested 15% of their workflows for verifiability of results, comparability of workflows, progression of the data for the analysis and origin of results, and evolution to see how data products evolved during an experiment.</p>
        <p>Furthermore, Sahoo et al [<xref ref-type="bibr" rid="ref38">38</xref>] examined the proportion of provenance metadata information across research articles using a qualitative hypothesis method. The method also provides a provenance ranking algorithm for the computation of a reproducibility rank for each article. The outcome of the self-contained DataLad data set presented valid, machine-actionable provenance information for every single result file of the performed data processing [<xref ref-type="bibr" rid="ref82">82</xref>].</p>
        <p>Numerical indication of completeness was not achieved in any of the other papers. However, the papers pointed out the advantages of provenance capture, for example, related to the longevity and accessibility of data after years [<xref ref-type="bibr" rid="ref40">40</xref>].</p>
      </sec>
      <sec>
        <title>Road Map for a Tailor-Made Provenance Framework</title>
        <p>On the basis of the insights obtained from the literature review, we developed a road map for the implementation of a tailor-made provenance framework (Provenance-SFL). This approach is based on the SFL for the development, provision, and management of software [<xref ref-type="bibr" rid="ref87">87</xref>]. The heterogeneous tracking approaches, their artifacts, and varying degrees of fulfillment of the RQs are depicted in <xref rid="figure6" ref-type="fig">Figure 6</xref> and determine our main discussion points.</p>
        <fig id="figure6" position="float">
          <label>Figure 6</label>
          <caption>
            <p>Road map toward a tailor-made provenance framework (Provenance-Software Framework Lifecycle [SFL]). The road map shows the 4 major processing phases in the inner circle segments: starting with the requirements definition, setup of the design based on the requirements, followed by coding and testing phases related to the given requirements and the implementation after successful testing. The outer and innermost circle present the mapped sections from our research questions approach to the Provenance-SFL. OPM: Open Provenance Model; W3C: World Wide Web Consortium.</p>
          </caption>
          <graphic xlink:href="jmir_v26i1e51297_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>This scoping review presents various approaches and criteria for provenance tracking as a crucial aspect of research, especially in the biomedical domain. Our holistic view leads to an extensive summary of pooled research results, provides possible answers to the 5 RQs and discloses current knowledge gaps.</p>
        <p>Following the previously published scoping review protocol and the described deviation led us to include 66 full-text papers from initially 764 papers found in the PubMed and Web of Science databases. Using a structured and pretested data extraction sheet, contextual, but detailed, results were extracted to answer the 5 RQs defined in the protocol. The results of the scoping review led us to propose a Provenance-SFL road map, which distinguishes between the framework types and model characteristics, the validation status, and the requirement and provenance characteristics (<xref rid="figure6" ref-type="fig">Figure 6</xref>).</p>
        <p>Most models in this review referred to the W3C PROV and OPM standards. As shown in <xref rid="figure2" ref-type="fig">Figure 2</xref>, an increased number of papers relate to the implementation frameworks published between 2016 and 2022. One reason for the increase in implementations might be the substantiation to extend W3C PROV and OPM [<xref ref-type="bibr" rid="ref58">58</xref>]. Another reason might be the increasing awareness of data management practices. At present, heterogeneous data sources, dynamic infrastructures, data exchange across boundaries, and a lack of standards for quality measures characterize the state of electronic health record data sets [<xref ref-type="bibr" rid="ref48">48</xref>].</p>
        <p>A provenance framework must acknowledge the semantic complexity of the domain and its relevant facets and requirements [<xref ref-type="bibr" rid="ref58">58</xref>] and the importance of good data management tooling and practices (<xref rid="figure2" ref-type="fig">Figure 2</xref>). In addition to requirements analysis, a thorough strategy is necessary to plan the typical data management steps such as collecting, managing, and analyzing data [<xref ref-type="bibr" rid="ref30">30</xref>]. According to Curcin [<xref ref-type="bibr" rid="ref4">4</xref>], validation readiness can be achieved by separating modeling and verification of provenance data from the software implementation. We agree that precise requirements analysis, as part of the software life cycle, and the subsequent individual life cycle steps, such as testing and maintenance procedures, support the consequent temporal evolution and hence improve the quality of provenance frameworks and applications.</p>
        <p>When incorporated in an inspection, provenance information must be sufficient for a content-related validation against applicable and accepted standards [<xref ref-type="bibr" rid="ref4">4</xref>]. Therefore, precise validation methods for provenance services regarding usability and performance, scalability, fault tolerance, and functionality are needed [<xref ref-type="bibr" rid="ref64">64</xref>]. We saw that validation approaches are linked to the evolution of provenance modeling and subsequent implementation attempts. Curcin et al [<xref ref-type="bibr" rid="ref1">1</xref>] argued that it was necessary to launch more formal software engineering techniques to foster provenance implementation across a broad range of software tools in the biomedical domain and beyond. In that sense, formal validation as part of the software engineering process contributes to increased software and data quality. Formal validation requires testing efforts and testing evidence. Accurate alignment of testing procedures against predefined requirements in the software life cycle could not be identified in the included papers.</p>
        <p>Provenance information is of high value for the scientific and biomedical community (eg, researchers); support staff (eg, developers); patients and other third parties (eg, data privacy officer or authority; <xref rid="figure4" ref-type="fig">Figure 4</xref>). It is interesting to see that despite the high impact of provenance (<xref ref-type="supplementary-material" rid="app7">Multimedia Appendix 7</xref>), only some stakeholders provide sufficient provenance information. Rather, it appears that responsibility for overall provenance management is being shifted to the support staff [<xref ref-type="bibr" rid="ref88">88</xref>]. We argue that available technology, IT knowledge, and data management skills need to be paired with both domain-specific knowledge and combined with constraints of legal nature or guidance [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref50">50</xref>]. This complexity indeed results in a very time-consuming business. However, automation and metadata collection can support this process [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref6">6</xref>]. As a matter of fact, good provenance information strengthens the credibility of the data and proves that data have not been intentionally or unintentionally changed throughout the data life cycle [<xref ref-type="bibr" rid="ref89">89</xref>].</p>
        <p>We believe that the persisting disagreement on the interpretation of the term <italic>provenance</italic> hampers the uptake of existing frameworks. A unique understanding of the concepts surrounding provenance should be developed, followed by engineering efforts for modeling, implementation, and validation interventions. The ISO 8000-2:2022 standard [<xref ref-type="bibr" rid="ref90">90</xref>] defines the term <italic>data quality</italic> and clearly recommends defining degrees of requirements. This definition should be considered for use in provenance systems.</p>
        <p>With regard to the implementation of provenance systems, we observed that increasing legal and scientific demands require research projects to be implemented more transparently. However, the granularity of provenance could not yet be resolved and so-called knowledge bottlenecks [<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref65">65</xref>] persist. It is important to understand that appropriate modeling of provenance information and effective provenance management techniques are required to protect sensitive provenance data.</p>
        <p>It furthermore remains unclear how to scale provenance systems for high amounts of data [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref58">58</xref>] (eg, how to store and represent provenance information in an aggregated and efficient manner or how to assist users in sophisticated provenance queries [<xref ref-type="bibr" rid="ref13">13</xref>]). Without doubt, automated and scalable solutions become impelling due to new challenges arising from the disposal and use of permanently increasing computing power [<xref ref-type="bibr" rid="ref40">40</xref>]. Growing focus is on the usability of the interface, particularly when provenance systems are implemented in the broad medical community, including patients, physicians, and researchers [<xref ref-type="bibr" rid="ref73">73</xref>].</p>
        <p>The lack of mandatory specifications or guidelines for provenance capture might be the reason why other papers only mention partial completeness. We strongly recommend doing more research on completeness checks as part of provenance tracing. The level of completeness and accuracy of provenance information of core data elements, especially in real-world data, could reveal data integrity issues and thus, affect the overall validity of the study results. Furthermore, reproducibility significantly depends on the accuracy of provenance information. For example, Mondelli et al [<xref ref-type="bibr" rid="ref27">27</xref>] delivered a tool for better scientific and longitudinal data management, which supports users, reproducibility by provenance, and reproduction through docker containers.</p>
        <p>Interestingly, the concept of “quality of provenance” is not clearly defined in any of the papers included for this review. We believe that data quality issues need to be addressed to reach completeness, accuracy, and timeliness of the data and to create trust in it.</p>
        <p>Another direction reveals the importance of good and systematic data management practices [<xref ref-type="bibr" rid="ref51">51</xref>] and the coordination with relevant stakeholders through the data life cycle. As such, first approaches toward interdisciplinary collaboration started within the MIRAPIE community project [<xref ref-type="bibr" rid="ref91">91</xref>] and were also recognized in the CAESAR project [<xref ref-type="bibr" rid="ref75">75</xref>].</p>
        <p>In summary, our review collects and structures the challenges during the accomplishment of provenance capture (<xref rid="figure5" ref-type="fig">Figure 5</xref>). Challenges that address missing or lacking organizational and technical capabilities were triangulated into more specific subcategories such as organizational (eg, investment and training and administrative) and technical (eg, granularity, performance and modeling and metadata annotation, delimitation reproducibility, and replicability) challenges.</p>
      </sec>
      <sec>
        <title>Comparison With Prior Work</title>
        <p>In the realm of similar studies, a recent systematic literature review by Sembay et al [<xref ref-type="bibr" rid="ref92">92</xref>] delved into provenance data management in health information systems. This review is a valuable resource if interested in the technical aspects, encompassing various methods, models, methodologies, and technologies associated with provenance data management in health information systems. It followed the guidelines proposed by Kitchenham and Charters [<xref ref-type="bibr" rid="ref93">93</xref>] for performing systematic literature reviews in software engineering. Another systematic literature review by Ahmed et al [<xref ref-type="bibr" rid="ref94">94</xref>] studied the impacts of data provenance in health care and General Data Protection Regulation compliance–based data provenance from a technological perspective. Although our RQ1 shares conceptual and domain-related similarities with the compared studies, there are notable differences in scope, RQs, methodological approaches, and thematic analysis focus.</p>
        <p>More than a year after we published our protocol and concluded the thematic analysis of our review findings, a scoping review on biomedical data provenance was published [<xref ref-type="bibr" rid="ref95">95</xref>]. The authors acknowledged and referenced our protocol. As they had anticipated, our review comprised 5 broad RQs, with the primary overlap occurring in RQ1. However, our scoping review offers more comprehensive results concerning the practical application of provenance and the associated challenges, including aspects such as completeness and validation. In addition, we provide in-depth descriptions of thematic areas and their subtopics, supported by tables, figures, and, most notably, a development of a tailor-made provenance framework road map. These aspects can be considered as the added value of our findings.</p>
        <p>Our scoping review shares only few references with the other 2 (in detail: 11 out of 66 references are identical with references used in Johns et al [<xref ref-type="bibr" rid="ref95">95</xref>] and 2 references are identical with those used in Sembay et al [<xref ref-type="bibr" rid="ref92">92</xref>]). Therefore, all 4 reviews examine different research results and focus on other aspects. Ahmed et al [<xref ref-type="bibr" rid="ref94">94</xref>] did not provide the list of the selected 59 articles.</p>
      </sec>
      <sec>
        <title>Strengths and Limitations</title>
        <p>This work applied a rigorous scoping review methodology using the framework developed by Arksey and O’Malley [<xref ref-type="bibr" rid="ref16">16</xref>]. All screening stages were carried out by at least 2 independent reviews of 4 members. A previously published protocol [<xref ref-type="bibr" rid="ref17">17</xref>] guided our review. The fact that the scoping review includes comprehensive results for the 5 related RQs and a road map for a tailor-made Provenance-SFL framework with many additional results as supplements can be considered a strength of this review. The criteria for categorization of provenance impact, requirements, and challenge classes were identified qualitatively in peer review.</p>
        <p>One limitation may be because we excluded gray literature from our analysis.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>In this paper, we highlighted various approaches and criteria for provenance tracking together with their referenced artifacts, and we developed a road map for a tailor-made Provenance-SFL framework.</p>
        <p>Provenance capture benefits all stakeholders involved in data processing, but it is associated with manifold and individual challenges during design, implementation, and the active use scenario phase.</p>
        <p>Sophisticated data management planning, documentation, metadata expression, and automation along the sensitive data-processing pipelines need to be scrutinized and implemented throughout the data life cycle and in adherence to the underlying infrastructure condition. With rising data volumes and the legal and scientific demands, there is an urgent need for greater transparency in implementing provenance systems in research projects, despite the challenges of unresolved granularity and knowledge bottlenecks. In addition, the roles and responsibilities of a data stewardship escorting the data should be expressed in this context and intensive training and education measures should be put in place. Guidance and recommendations are requested to provide the systematic measurement of provenance and calls for defining a minimal or gold standard. Governance for good data management and scale-up of good data management capabilities matter in this regard.</p>
        <p>The mentioned artifacts, particularly those related to quality aspects, can be seen as transition points resulting from incomplete preliminary work. Therefore, harmonized engineering efforts are now necessary to overcoming the existing hurdles. Awareness of these challenges can facilitate an easier qualified and accurate provenance construction and auditable consumption while enforcing FAIR principles and interoperability standards for data sharing. The effect of provenance for data quality monitoring and the impact of expressive metadata on provenance quality can be considered as open RQs for future work.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Search strings and queries used for database search.</p>
        <media xlink:href="jmir_v26i1e51297_app1.docx" xlink:title="DOCX File , 15 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>PRISMA-ScR (Preferred Reporting Items for Systematic Reviews and Meta-Analyses extension for Scoping Reviews) checklist. Filled-in checklist items for the scoping review.</p>
        <media xlink:href="jmir_v26i1e51297_app2.docx" xlink:title="DOCX File , 84 KB"/>
      </supplementary-material>
      <supplementary-material id="app3">
        <label>Multimedia Appendix 3</label>
        <p>Document characteristics of the study corpus. Document characteristics of the study corpus containing presentation of studies between 2006 and 2022 and allocation to the target domain.</p>
        <media xlink:href="jmir_v26i1e51297_app3.docx" xlink:title="DOCX File , 76 KB"/>
      </supplementary-material>
      <supplementary-material id="app4">
        <label>Multimedia Appendix 4</label>
        <p>Studies and their respective assignment to a framework type. Framework types are displayed by categories and characteristics of provenance. “Framework—practical provenance management” comprises practical efforts for development and implementation of a provenance approach. “Framework—theoretical provenance management” approach includes ideas and generic principles for provenance consideration.</p>
        <media xlink:href="jmir_v26i1e51297_app4.docx" xlink:title="DOCX File , 83 KB"/>
      </supplementary-material>
      <supplementary-material id="app5">
        <label>Multimedia Appendix 5</label>
        <p>Included articles and their related model. Included articles grouped by their related model respectively by using similar approaches. Counts for categories and subcategories are given per model group and approach.</p>
        <media xlink:href="jmir_v26i1e51297_app5.docx" xlink:title="DOCX File , 16 KB"/>
      </supplementary-material>
      <supplementary-material id="app6">
        <label>Multimedia Appendix 6</label>
        <p>Reported requirements or factors for provenance. Studies cited to classification, description, and counting of requirement or factor terms.</p>
        <media xlink:href="jmir_v26i1e51297_app6.docx" xlink:title="DOCX File , 20 KB"/>
      </supplementary-material>
      <supplementary-material id="app7">
        <label>Multimedia Appendix 7</label>
        <p>Reported impacts and stakeholders of provenance information. Included articles and counting of impacts per category; shows the structure and relationship between the individual stakeholders and the reported impacts. The comprehensive meaning of the impact is explained in the column “Description” by the assignment of the individual statements from the mentioned papers.</p>
        <media xlink:href="jmir_v26i1e51297_app7.docx" xlink:title="DOCX File , 26 KB"/>
      </supplementary-material>
      <supplementary-material id="app8">
        <label>Multimedia Appendix 8</label>
        <p>Reported technical and organizational challenges. Included articles and counting per category and subcategory for reported challenges, problems, and bottlenecks during accomplishment of provenance.</p>
        <media xlink:href="jmir_v26i1e51297_app8.docx" xlink:title="DOCX File , 31 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">FAIR</term>
          <def>
            <p>findable, accessible, interoperable, reusable</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">ISO</term>
          <def>
            <p>International Organization for Standardization</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">OPM</term>
          <def>
            <p>Open Provenance Model</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">PRISMA</term>
          <def>
            <p>Preferred Reporting Items for Systematic Reviews and Meta-Analyses</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">PRISMA-ScR</term>
          <def>
            <p>Preferred Reporting Items for Systematic Reviews and Meta-Analyses Extension for Scoping Reviews</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">RQ</term>
          <def>
            <p>research question</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">SFL</term>
          <def>
            <p>Software Framework Life Cycle</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">W3C</term>
          <def>
            <p>World Wide Web Consortium</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This research is funded by the German Federal Ministry of Education and Research within the German Medical Informatics Initiative with the grant 01ZZ1801E (Medical Informatics in Research and Care in University Medicine), by the Deutsche Forschungsgemeinschaft (DFG, German Research Foundation) SFB 1270/2-99150580, and by the National Research Data Infrastructure for Personal Health Data (NFDI4Health) DFG-funded project (Project 442326535). For the publication fee, the authors would like to acknowledge financial support by Heidelberg University.</p>
    </ack>
    <notes>
      <sec>
        <title>Data Availability</title>
        <p>All data generated or analyzed during this study are included in this published manuscript and its supplementary information files.</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="con">
        <p>KG contributed substantially to the conception, design, screening, data extraction, data charting, graphical representation, data analysis and interpretation, drafting all sections of the manuscript, coordinated reviewing, incorporating the comments from the coauthors, and submitting the paper. FK contributed to the discussion of the concept, screening, data extraction, data charting, and finalization of the manuscript and presented the graphical analysis of the extracted data. SG and FH contributed to data extraction and screening. FS contributed to finalization of manuscript. DW contributed to the discussion of the concept, partial screening, editorial revision, and finalization of the manuscript. AAZ contributed to the discussion of the concept, partial data analysis, screening, data extraction, data charting, editorial revision, and finalization of the manuscript. TG contributed to the discussion of the concept and finalization of the manuscript.</p>
        <p>All authors reviewed and approved the submitted version of the manuscript. They agreed both to be personally accountable for the author’s contributions and ensured that questions related to the accuracy or integrity of any part of the work, even ones in which the author was not personally involved, are appropriately investigated, resolved, and the resolution documented in the literature.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Curcin</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Miles</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Danger</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Bache</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Taweel</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Implementing interoperable provenance in biomedical research</article-title>
          <source>Future Gener Comput Syst</source>
          <year>2014</year>
          <month>05</month>
          <volume>34</volume>
          <fpage>1</fpage>
          <lpage>16</lpage>
          <pub-id pub-id-type="doi">10.1016/j.future.2013.12.001</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jayapandian</surname>
              <given-names>CP</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ewing</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>GQ</given-names>
            </name>
            <name name-style="western">
              <surname>Sahoo</surname>
              <given-names>SS</given-names>
            </name>
          </person-group>
          <article-title>A semantic proteomics dashboard (SemPoD) for data management in translational research</article-title>
          <source>BMC Syst Biol</source>
          <year>2012</year>
          <month>12</month>
          <day>17</day>
          <volume>6</volume>
          <issue>S3</issue>
          <fpage>S20</fpage>
          <pub-id pub-id-type="doi">10.1186/1752-0509-6-s3-s20</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cuggia</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Combes</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>The French health data hub and the German medical informatics initiatives: two national projects to promote data sharing in healthcare</article-title>
          <source>Yearb Med Inform</source>
          <year>2019</year>
          <month>08</month>
          <day>16</day>
          <volume>28</volume>
          <issue>1</issue>
          <fpage>195</fpage>
          <lpage>202</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.thieme-connect.com/DOI/DOI?10.1055/s-0039-1677917"/>
          </comment>
          <pub-id pub-id-type="doi">10.1055/s-0039-1677917</pub-id>
          <pub-id pub-id-type="medline">31419832</pub-id>
          <pub-id pub-id-type="pmcid">PMC6697511</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Curcin</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Embedding data provenance into the learning health system to facilitate reproducible research</article-title>
          <source>Learn Health Syst</source>
          <year>2017</year>
          <month>04</month>
          <day>27</day>
          <volume>1</volume>
          <issue>2</issue>
          <fpage>e10019</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31245557"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/lrh2.10019</pub-id>
          <pub-id pub-id-type="medline">31245557</pub-id>
          <pub-id pub-id-type="pii">LRH210019</pub-id>
          <pub-id pub-id-type="pmcid">PMC6516719</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wodke</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Michaelis</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Henkel</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>The MeDaX knowledge graph prototype</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2023</year>
          <month>05</month>
          <day>18</day>
          <volume>302</volume>
          <fpage>147</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.3233/SHTI230089</pub-id>
          <pub-id pub-id-type="medline">37203634</pub-id>
          <pub-id pub-id-type="pii">SHTI230089</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schröder</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Staehlke</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Groth</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Nebe</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Spors</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Krüger</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Structure-based knowledge acquisition from electronic lab notebooks for research data provenance documentation</article-title>
          <source>J Biomed Semantics</source>
          <year>2022</year>
          <month>01</month>
          <day>31</day>
          <volume>13</volume>
          <issue>1</issue>
          <fpage>4</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://jbiomedsem.biomedcentral.com/articles/10.1186/s13326-021-00257-x"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s13326-021-00257-x</pub-id>
          <pub-id pub-id-type="medline">35101121</pub-id>
          <pub-id pub-id-type="pii">10.1186/s13326-021-00257-x</pub-id>
          <pub-id pub-id-type="pmcid">PMC8802522</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>KE</given-names>
            </name>
            <name name-style="western">
              <surname>Kamineni</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Fuller</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Olmstead</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Wernli</surname>
              <given-names>KJ</given-names>
            </name>
          </person-group>
          <article-title>How the provenance of electronic health record data matters for research: a case example using system mapping</article-title>
          <source>EGEMS (Wash DC)</source>
          <year>2014</year>
          <month>04</month>
          <day>16</day>
          <volume>2</volume>
          <issue>1</issue>
          <fpage>1058</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/25821838"/>
          </comment>
          <pub-id pub-id-type="doi">10.13063/2327-9214.1058</pub-id>
          <pub-id pub-id-type="medline">25821838</pub-id>
          <pub-id pub-id-type="pii">egems1058</pub-id>
          <pub-id pub-id-type="pmcid">PMC4371416</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="web">
          <article-title>PROV-overview</article-title>
          <source>World Wide Web Consortium</source>
          <access-date>2024-03-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.w3.org/TR/prov-overview/">https://www.w3.org/TR/prov-overview/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wilkinson</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Dumontier</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Aalbersberg</surname>
              <given-names>IJ</given-names>
            </name>
            <name name-style="western">
              <surname>Appleton</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Axton</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Baak</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Blomberg</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Boiten</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>da Silva Santos</surname>
              <given-names>LB</given-names>
            </name>
            <name name-style="western">
              <surname>Bourne</surname>
              <given-names>PE</given-names>
            </name>
            <name name-style="western">
              <surname>Bouwman</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Brookes</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Clark</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Crosas</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dillo</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Dumon</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Edmunds</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Evelo</surname>
              <given-names>CT</given-names>
            </name>
            <name name-style="western">
              <surname>Finkers</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Gonzalez-Beltran</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gray</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Groth</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Goble</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Grethe</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Heringa</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>'t Hoen</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Hooft</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Kuhn</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Kok</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Kok</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lusher</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Martone</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Mons</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Packer</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Persson</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Rocca-Serra</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Roos</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>van Schaik</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Sansone</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Schultes</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Sengstag</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Slater</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Strawn</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Swertz</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Thompson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>van der Lei</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>van Mulligen</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Velterop</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Waagmeester</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wittenburg</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Wolstencroft</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Mons</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>The FAIR Guiding Principles for scientific data management and stewardship</article-title>
          <source>Sci Data</source>
          <year>2016</year>
          <month>03</month>
          <day>15</day>
          <volume>3</volume>
          <issue>1</issue>
          <fpage>160018</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/sdata.2016.18"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/sdata.2016.18</pub-id>
          <pub-id pub-id-type="medline">26978244</pub-id>
          <pub-id pub-id-type="pii">sdata201618</pub-id>
          <pub-id pub-id-type="pmcid">PMC4792175</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Inau</surname>
              <given-names>ET</given-names>
            </name>
            <name name-style="western">
              <surname>Sack</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Waltemath</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Zeleke</surname>
              <given-names>AA</given-names>
            </name>
          </person-group>
          <article-title>Initiatives, concepts, and implementation practices of FAIR (findable, accessible, interoperable, and reusable) data principles in health data stewardship practice: protocol for a scoping review</article-title>
          <source>JMIR Res Protoc</source>
          <year>2021</year>
          <month>03</month>
          <day>02</day>
          <volume>10</volume>
          <issue>2</issue>
          <fpage>e22505</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.researchprotocols.org/2021/2/e22505/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/22505</pub-id>
          <pub-id pub-id-type="medline">33528373</pub-id>
          <pub-id pub-id-type="pii">v10i2e22505</pub-id>
          <pub-id pub-id-type="pmcid">PMC7886612</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jauer</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Deserno</surname>
              <given-names>TM</given-names>
            </name>
          </person-group>
          <article-title>Data provenance standards and recommendations for FAIR data</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2020</year>
          <month>06</month>
          <day>16</day>
          <volume>270</volume>
          <fpage>1237</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.3233/SHTI200380</pub-id>
          <pub-id pub-id-type="medline">32570597</pub-id>
          <pub-id pub-id-type="pii">SHTI200380</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hume</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sarnikar</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Noteboom</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Enhancing traceability in clinical research data through a metadata framework</article-title>
          <source>Methods Inf Med</source>
          <year>2020</year>
          <month>05</month>
          <day>07</day>
          <volume>59</volume>
          <issue>2-03</issue>
          <fpage>75</fpage>
          <lpage>85</lpage>
          <pub-id pub-id-type="doi">10.1055/s-0040-1714393</pub-id>
          <pub-id pub-id-type="medline">32894879</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sahoo</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Bodenreider</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Parikh</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Minning</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Sheth</surname>
              <given-names>AP</given-names>
            </name>
          </person-group>
          <article-title>A unified framework for managing provenance information in translational research</article-title>
          <source>BMC Bioinformatics</source>
          <year>2011</year>
          <month>11</month>
          <day>29</day>
          <volume>12</volume>
          <issue>1</issue>
          <fpage>461</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcbioinformatics.biomedcentral.com/articles/10.1186/1471-2105-12-461"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1471-2105-12-461</pub-id>
          <pub-id pub-id-type="medline">22126369</pub-id>
          <pub-id pub-id-type="pii">1471-2105-12-461</pub-id>
          <pub-id pub-id-type="pmcid">PMC3298549</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yakutovich</surname>
              <given-names>AV</given-names>
            </name>
            <name name-style="western">
              <surname>Eimre</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Schütt</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Talirz</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Adorf</surname>
              <given-names>CS</given-names>
            </name>
            <name name-style="western">
              <surname>Andersen</surname>
              <given-names>CW</given-names>
            </name>
            <name name-style="western">
              <surname>Ditler</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Du</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Passerone</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Smit</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Marzari</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Pizzi</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Pignedoli</surname>
              <given-names>CA</given-names>
            </name>
          </person-group>
          <article-title>AiiDAlab – an ecosystem for developing, executing, and sharing scientific workflows</article-title>
          <source>Comput Mater Sci</source>
          <year>2021</year>
          <month>02</month>
          <volume>188</volume>
          <fpage>110165</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1016/j.commatsci.2020.110165"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.commatsci.2020.110165</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schissel</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Abla</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Flanagan</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Greenwald</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Romosan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Shoshani</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Stillerman</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wright</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Automated metadata, provenance cataloging and navigable interfaces: ensuring the usefulness of extreme-scale data</article-title>
          <source>Fusion Eng Des</source>
          <year>2014</year>
          <month>05</month>
          <volume>89</volume>
          <issue>5</issue>
          <fpage>745</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1016/j.fusengdes.2014.01.053</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Arksey</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>O'Malley</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Scoping studies: towards a methodological framework</article-title>
          <source>Int J Soc Res Methodol</source>
          <year>2005</year>
          <month>02</month>
          <volume>8</volume>
          <issue>1</issue>
          <fpage>19</fpage>
          <lpage>32</lpage>
          <pub-id pub-id-type="doi">10.1080/1364557032000119616</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gierend</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Krüger</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Waltemath</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Fünfgeld</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ganslandt</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Zeleke</surname>
              <given-names>AA</given-names>
            </name>
          </person-group>
          <article-title>Approaches and criteria for provenance in biomedical data sets and workflows: protocol for a scoping review</article-title>
          <source>JMIR Res Protoc</source>
          <year>2021</year>
          <month>11</month>
          <day>22</day>
          <volume>10</volume>
          <issue>11</issue>
          <fpage>e31750</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.researchprotocols.org/2021/11/e31750/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/31750</pub-id>
          <pub-id pub-id-type="medline">34813494</pub-id>
          <pub-id pub-id-type="pii">v10i11e31750</pub-id>
          <pub-id pub-id-type="pmcid">PMC8663663</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Braun</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Clarke</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Using thematic analysis in psychology</article-title>
          <source>Qual Res Psychol</source>
          <year>2006</year>
          <month>01</month>
          <volume>3</volume>
          <issue>2</issue>
          <fpage>77</fpage>
          <lpage>101</lpage>
          <pub-id pub-id-type="doi">10.1191/1478088706qp063oa</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ouzzani</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hammady</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Fedorowicz</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Elmagarmid</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Rayyan-a web and mobile app for systematic reviews</article-title>
          <source>Syst Rev</source>
          <year>2016</year>
          <month>12</month>
          <day>05</day>
          <volume>5</volume>
          <issue>1</issue>
          <fpage>210</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://systematicreviewsjournal.biomedcentral.com/articles/10.1186/s13643-016-0384-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s13643-016-0384-4</pub-id>
          <pub-id pub-id-type="medline">27919275</pub-id>
          <pub-id pub-id-type="pii">10.1186/s13643-016-0384-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC5139140</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Van Rossum</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Drake</surname>
              <given-names>FL</given-names>
            </name>
          </person-group>
          <source>Python 3 Reference Manual</source>
          <year>2009</year>
          <publisher-loc>Scotts Valley, CA</publisher-loc>
          <publisher-name>CreateSpace</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>R Core Team</collab>
          </person-group>
          <article-title>The R project for statistical computing</article-title>
          <source>R Foundation for Statistical Computing</source>
          <access-date>2024-04-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.r-project.org/">https://www.r-project.org/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wickham</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Averick</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bryan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>McGowan</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>François</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Grolemund</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Hayes</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Henry</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Hester</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kuhn</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pedersen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Bache</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Müller</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Ooms</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Robinson</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Seidel</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Spinu</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Takahashi</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Vaughan</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Wilke</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Woo</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Yutani</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Welcome to the Tidyverse</article-title>
          <source>J Open Source Softw</source>
          <year>2019</year>
          <month>11</month>
          <volume>4</volume>
          <issue>43</issue>
          <fpage>1686</fpage>
          <pub-id pub-id-type="doi">10.21105/joss.01686</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tricco</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Lillie</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Zarin</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>O'Brien</surname>
              <given-names>KK</given-names>
            </name>
            <name name-style="western">
              <surname>Colquhoun</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Levac</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Moher</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Peters</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Horsley</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Weeks</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Hempel</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Akl</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>McGowan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Stewart</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Hartling</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Aldcroft</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wilson</surname>
              <given-names>MG</given-names>
            </name>
            <name name-style="western">
              <surname>Garritty</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lewin</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Godfrey</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Macdonald</surname>
              <given-names>MT</given-names>
            </name>
            <name name-style="western">
              <surname>Langlois</surname>
              <given-names>EV</given-names>
            </name>
            <name name-style="western">
              <surname>Soares-Weiser</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Moriarty</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Clifford</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Tunçalp</surname>
              <given-names>Ö</given-names>
            </name>
            <name name-style="western">
              <surname>Straus</surname>
              <given-names>SE</given-names>
            </name>
          </person-group>
          <article-title>PRISMA extension for scoping reviews (PRISMA-ScR): checklist and explanation</article-title>
          <source>Ann Intern Med</source>
          <year>2018</year>
          <month>10</month>
          <day>02</day>
          <volume>169</volume>
          <issue>7</issue>
          <fpage>467</fpage>
          <lpage>73</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.acpjournals.org/doi/abs/10.7326/M18-0850?url_ver=Z39.88-2003&#38;rfr_id=ori:rid:crossref.org&#38;rfr_dat=cr_pub  0pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.7326/M18-0850</pub-id>
          <pub-id pub-id-type="medline">30178033</pub-id>
          <pub-id pub-id-type="pii">2700389</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Page</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>McKenzie</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Bossuyt</surname>
              <given-names>PM</given-names>
            </name>
            <name name-style="western">
              <surname>Boutron</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Hoffmann</surname>
              <given-names>TC</given-names>
            </name>
            <name name-style="western">
              <surname>Mulrow</surname>
              <given-names>CD</given-names>
            </name>
            <name name-style="western">
              <surname>Shamseer</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Tetzlaff</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Akl</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Brennan</surname>
              <given-names>SE</given-names>
            </name>
            <name name-style="western">
              <surname>Chou</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Glanville</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Grimshaw</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Hróbjartsson</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lalu</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Loder</surname>
              <given-names>EW</given-names>
            </name>
            <name name-style="western">
              <surname>Mayo-Wilson</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>McDonald</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>McGuinness</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Stewart</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Thomas</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tricco</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Welch</surname>
              <given-names>VA</given-names>
            </name>
            <name name-style="western">
              <surname>Whiting</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Moher</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>The PRISMA 2020 statement: an updated guideline for reporting systematic reviews</article-title>
          <source>BMJ</source>
          <year>2021</year>
          <month>03</month>
          <day>29</day>
          <volume>372</volume>
          <fpage>n71</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.bmj.com/lookup/pmidlookup?view=long&#38;pmid=33782057"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmj.n71</pub-id>
          <pub-id pub-id-type="medline">33782057</pub-id>
          <pub-id pub-id-type="pmcid">PMC8005924</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Daumke</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Heitmann</surname>
              <given-names>KU</given-names>
            </name>
            <name name-style="western">
              <surname>Heckmann</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Martínez-Costa</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Schulz</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Clinical text mining on FHIR</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2019</year>
          <month>08</month>
          <day>21</day>
          <volume>264</volume>
          <fpage>83</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.3233/SHTI190188</pub-id>
          <pub-id pub-id-type="medline">31437890</pub-id>
          <pub-id pub-id-type="pii">SHTI190188</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Parciak</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bauer</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bender</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Lodahl</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Schreiweis</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Tute</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Sax</surname>
              <given-names>U</given-names>
            </name>
          </person-group>
          <article-title>Provenance solutions for medical research in heterogeneous IT-infrastructure: an implementation roadmap</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2019</year>
          <month>08</month>
          <day>21</day>
          <volume>264</volume>
          <fpage>298</fpage>
          <lpage>302</lpage>
          <pub-id pub-id-type="doi">10.3233/SHTI190231</pub-id>
          <pub-id pub-id-type="medline">31437933</pub-id>
          <pub-id pub-id-type="pii">SHTI190231</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mondelli</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Magalhães</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Loss</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Wilde</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Foster</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Mattoso</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Katz</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Barbosa</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>de Vasconcelos</surname>
              <given-names>AT</given-names>
            </name>
            <name name-style="western">
              <surname>Ocaña</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Gadelha</surname>
              <given-names>LM</given-names>
            </name>
          </person-group>
          <article-title>BioWorkbench: a high-performance framework for managing and analyzing bioinformatics experiments</article-title>
          <source>PeerJ</source>
          <year>2018</year>
          <volume>6</volume>
          <fpage>e5551</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/30186700"/>
          </comment>
          <pub-id pub-id-type="doi">10.7717/peerj.5551</pub-id>
          <pub-id pub-id-type="medline">30186700</pub-id>
          <pub-id pub-id-type="pii">5551</pub-id>
          <pub-id pub-id-type="pmcid">PMC6119457</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Keator</surname>
              <given-names>DB</given-names>
            </name>
            <name name-style="western">
              <surname>Helmer</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Steffener</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Turner</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Van Erp</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Gadde</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ashish</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Burns</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Nichols</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Towards structured sharing of raw and derived neuroimaging data across existing resources</article-title>
          <source>Neuroimage</source>
          <year>2013</year>
          <month>11</month>
          <day>15</day>
          <volume>82</volume>
          <fpage>647</fpage>
          <lpage>61</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/23727024"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.neuroimage.2013.05.094</pub-id>
          <pub-id pub-id-type="medline">23727024</pub-id>
          <pub-id pub-id-type="pii">S1053-8119(13)00596-X</pub-id>
          <pub-id pub-id-type="pmcid">PMC4028152</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Celebi</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Rebelo Moreira</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hassan</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Ayyar</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ridder</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Kuhn</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Dumontier</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Towards FAIR protocols and workflows: the OpenPREDICT use case</article-title>
          <source>PeerJ Comput Sci</source>
          <year>2020</year>
          <volume>6</volume>
          <fpage>e281</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33816932"/>
          </comment>
          <pub-id pub-id-type="doi">10.7717/peerj-cs.281</pub-id>
          <pub-id pub-id-type="medline">33816932</pub-id>
          <pub-id pub-id-type="pii">cs-281</pub-id>
          <pub-id pub-id-type="pmcid">PMC7924452</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pimentel</surname>
              <given-names>JF</given-names>
            </name>
            <name name-style="western">
              <surname>Freire</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Murta</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Braganholo</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>A survey on collecting, managing, and analyzing provenance from scripts</article-title>
          <source>ACM Comput Surv</source>
          <year>2019</year>
          <month>06</month>
          <day>18</day>
          <volume>52</volume>
          <issue>3</issue>
          <fpage>1</fpage>
          <lpage>38</lpage>
          <pub-id pub-id-type="doi">10.1145/3311955</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bánáti</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kacsuk</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Kozlovszky</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Reproducibility analysis of scientific workflows</article-title>
          <source>Acta polytech Hung</source>
          <year>2017</year>
          <month>05</month>
          <day>03</day>
          <volume>14</volume>
          <issue>2</issue>
          <fpage>17</fpage>
          <pub-id pub-id-type="doi">10.12700/aph.14.2.2017.2.11</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bechhofer</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Buchan</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>De Roure</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Missier</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Ainsworth</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bhagat</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Couch</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Cruickshank</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Delderfield</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dunlop</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Gamble</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Michaelides</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Owen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Newman</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Sufi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Goble</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Why linked data is not enough for scientists</article-title>
          <source>Future Gener Comput Syst</source>
          <year>2013</year>
          <month>02</month>
          <volume>29</volume>
          <issue>2</issue>
          <fpage>599</fpage>
          <lpage>611</lpage>
          <pub-id pub-id-type="doi">10.1016/j.future.2011.08.004</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Groth</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Moreau</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Representing distributed systems using the open provenance model</article-title>
          <source>Future Gener Comput Syst</source>
          <year>2011</year>
          <month>6</month>
          <volume>27</volume>
          <issue>6</issue>
          <fpage>757</fpage>
          <lpage>65</lpage>
          <pub-id pub-id-type="doi">10.1016/j.future.2010.10.001</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Golbeck</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hendler</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>A Semantic web approach to the provenance challenge</article-title>
          <source>Concurr Comput</source>
          <year>2008</year>
          <volume>20</volume>
          <issue>5</issue>
          <fpage>431</fpage>
          <lpage>439</lpage>
          <pub-id pub-id-type="doi">10.1002/cpe.1238</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schuchardt</surname>
              <given-names>KL</given-names>
            </name>
            <name name-style="western">
              <surname>Gibson</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Stephan</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Chin</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Applying content management to automated provenance capture</article-title>
          <source>Concurr Comput</source>
          <year>2008</year>
          <volume>20</volume>
          <issue>5</issue>
          <fpage>541</fpage>
          <lpage>54</lpage>
          <pub-id pub-id-type="doi">10.1002/cpe.1230</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Danese</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Halperin</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Duryea</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Duryea</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>The generalized data model for clinical research</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2019</year>
          <month>06</month>
          <day>24</day>
          <volume>19</volume>
          <issue>1</issue>
          <fpage>117</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-019-0837-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-019-0837-5</pub-id>
          <pub-id pub-id-type="medline">31234921</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-019-0837-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC6591926</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tyndall</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Tyndall</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>FHIR healthcare directories: adopting shared interfaces to achieve interoperable medical device data integration</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2018</year>
          <volume>249</volume>
          <fpage>181</fpage>
          <lpage>4</lpage>
          <pub-id pub-id-type="medline">29866978</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sahoo</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Valdez</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Rueschman</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Redline</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>ProvCaRe: characterizing scientific reproducibility of biomedical research studies using semantic provenance metadata</article-title>
          <source>Int J Med Inform</source>
          <year>2019</year>
          <month>01</month>
          <volume>121</volume>
          <fpage>10</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/30545485"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2018.10.009</pub-id>
          <pub-id pub-id-type="medline">30545485</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(18)30269-7</pub-id>
          <pub-id pub-id-type="pmcid">PMC6343667</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Rogers</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Fairweather</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Glenn</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Curran</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Curcin</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Application of data provenance in healthcare analytics software: information visualisation of user activities</article-title>
          <source>AMIA Jt Summits Transl Sci Proc</source>
          <year>2018</year>
          <volume>2017</volume>
          <fpage>263</fpage>
          <lpage>72</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/29888084"/>
          </comment>
          <pub-id pub-id-type="medline">29888084</pub-id>
          <pub-id pub-id-type="pmcid">PMC5961786</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huber</surname>
              <given-names>SP</given-names>
            </name>
            <name name-style="western">
              <surname>Zoupanos</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Uhrin</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Talirz</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Kahle</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Häuselmann</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Gresch</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Müller</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Yakutovich</surname>
              <given-names>AV</given-names>
            </name>
            <name name-style="western">
              <surname>Andersen</surname>
              <given-names>CW</given-names>
            </name>
            <name name-style="western">
              <surname>Ramirez</surname>
              <given-names>FF</given-names>
            </name>
            <name name-style="western">
              <surname>Adorf</surname>
              <given-names>CS</given-names>
            </name>
            <name name-style="western">
              <surname>Gargiulo</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Kumbhar</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Passaro</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Johnston</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Merkys</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cepellotti</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mounet</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Marzari</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Kozinsky</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Pizzi</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>AiiDA 1.0, a scalable computational infrastructure for automated reproducible workflows and data provenance</article-title>
          <source>Sci Data</source>
          <year>2020</year>
          <month>09</month>
          <day>08</day>
          <volume>7</volume>
          <issue>1</issue>
          <fpage>300</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41597-020-00638-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41597-020-00638-4</pub-id>
          <pub-id pub-id-type="medline">32901044</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41597-020-00638-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC7479590</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Madougou</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Santcroos</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Benabdelkader</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>van Schaik</surname>
              <given-names>BD</given-names>
            </name>
            <name name-style="western">
              <surname>Shahand</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Korkhov</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>van Kampen</surname>
              <given-names>AH</given-names>
            </name>
            <name name-style="western">
              <surname>Olabarriaga</surname>
              <given-names>SD</given-names>
            </name>
          </person-group>
          <article-title>Provenance for distributed biomedical workflow execution</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2012</year>
          <volume>175</volume>
          <fpage>91</fpage>
          <lpage>100</lpage>
          <pub-id pub-id-type="medline">22941992</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Guedes</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Martins</surname>
              <given-names>LB</given-names>
            </name>
            <name name-style="western">
              <surname>Falci</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Silva</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Ocaña</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Mattoso</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bedo</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>de Oliveira</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Capturing and analyzing provenance from spark-based scientific workflows with SAMbA-RaP</article-title>
          <source>Future Gener Comput Syst</source>
          <year>2020</year>
          <month>11</month>
          <volume>112</volume>
          <fpage>658</fpage>
          <lpage>69</lpage>
          <pub-id pub-id-type="doi">10.1016/j.future.2020.05.031</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Thavasimani</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Cala</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Missier</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Why-diff: exploiting provenance to understand outcome differences from non-identical reproduced workflows</article-title>
          <source>IEEE Access</source>
          <year>2019</year>
          <volume>7</volume>
          <fpage>34973</fpage>
          <lpage>90</lpage>
          <pub-id pub-id-type="doi">10.1109/access.2019.2903727</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Marinho</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>de Oliveira</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ogasawara</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Silva</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Ocaña</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Murta</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Braganholo</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Mattoso</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Deriving scientific workflows from algebraic experiment lines: a practical approach</article-title>
          <source>Future Gener Comput Syst</source>
          <year>2017</year>
          <month>03</month>
          <volume>68</volume>
          <fpage>111</fpage>
          <lpage>27</lpage>
          <pub-id pub-id-type="doi">10.1016/j.future.2016.08.016</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Danger</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Curcin</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Missier</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Bryans</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Access control and view generation for provenance graphs</article-title>
          <source>Future Gener Comput Syst</source>
          <year>2015</year>
          <month>08</month>
          <volume>49</volume>
          <fpage>8</fpage>
          <lpage>27</lpage>
          <pub-id pub-id-type="doi">10.1016/j.future.2015.01.014</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Moreau</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Provenance-based reproducibility in the Semantic Web</article-title>
          <source>J Web Semant</source>
          <year>2011</year>
          <month>07</month>
          <volume>9</volume>
          <issue>2</issue>
          <fpage>202</fpage>
          <lpage>21</lpage>
          <pub-id pub-id-type="doi">10.1016/j.websem.2011.03.001</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Holland</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Seltzer</surname>
              <given-names>MI</given-names>
            </name>
            <name name-style="western">
              <surname>Braun</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Muniswamy‐Reddy</surname>
              <given-names>KK</given-names>
            </name>
          </person-group>
          <article-title>PASSing the provenance challenge</article-title>
          <source>Concurr Comput</source>
          <year>2008</year>
          <volume>20</volume>
          <issue>5</issue>
          <fpage>531</fpage>
          <lpage>40</lpage>
          <pub-id pub-id-type="doi">10.1002/cpe.1227</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Margheri</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Masi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Miladi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sassone</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Rosenzweig</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Decentralised provenance for healthcare data</article-title>
          <source>Int J Med Inform</source>
          <year>2020</year>
          <month>09</month>
          <volume>141</volume>
          <fpage>104197</fpage>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2020.104197</pub-id>
          <pub-id pub-id-type="medline">32540775</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(19)31203-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sahoo</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Valdez</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Rueschman</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Scientific reproducibility in biomedical research: provenance metadata ontology for semantic annotation of study description</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2016</year>
          <volume>2016</volume>
          <fpage>1070</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/28269904"/>
          </comment>
          <pub-id pub-id-type="medline">28269904</pub-id>
          <pub-id pub-id-type="pmcid">PMC5333253</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Curcin</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Soljak</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Majeed</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Managing and exploiting routinely collected NHS data for research</article-title>
          <source>Inform Prim Care</source>
          <year>2013</year>
          <volume>20</volume>
          <issue>4</issue>
          <fpage>225</fpage>
          <lpage>31</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://hijournal.bcs.org/index.php/jhi/article/view/1"/>
          </comment>
          <pub-id pub-id-type="doi">10.14236/jhi.v20i4.1</pub-id>
          <pub-id pub-id-type="medline">23890333</pub-id>
          <pub-id pub-id-type="pii">1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Razick</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Močnik</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Thomas</surname>
              <given-names>LF</given-names>
            </name>
            <name name-style="western">
              <surname>Ryeng</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Drabløs</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Sætrom</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>The eGenVar data management system--cataloguing and sharing sensitive data and metadata for the life sciences</article-title>
          <source>Database (Oxford)</source>
          <year>2014</year>
          <volume>2014</volume>
          <fpage>bau027</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/24682735"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/database/bau027</pub-id>
          <pub-id pub-id-type="medline">24682735</pub-id>
          <pub-id pub-id-type="pii">bau027</pub-id>
          <pub-id pub-id-type="pmcid">PMC4030636</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Saccone</surname>
              <given-names>SF</given-names>
            </name>
            <name name-style="western">
              <surname>Quan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>PL</given-names>
            </name>
          </person-group>
          <article-title>BioQ: tracing experimental origins in public genomic databases using a novel data provenance model</article-title>
          <source>Bioinformatics</source>
          <year>2012</year>
          <month>04</month>
          <day>15</day>
          <volume>28</volume>
          <issue>8</issue>
          <fpage>1189</fpage>
          <lpage>91</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/22426342"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/bts117</pub-id>
          <pub-id pub-id-type="medline">22426342</pub-id>
          <pub-id pub-id-type="pii">bts117</pub-id>
          <pub-id pub-id-type="pmcid">PMC3324523</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Woodman</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hiden</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Watson</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Applications of provenance in performance prediction and data storage optimisation</article-title>
          <source>Future Gener Comput Syst</source>
          <year>2017</year>
          <month>10</month>
          <volume>75</volume>
          <fpage>299</fpage>
          <lpage>309</lpage>
          <pub-id pub-id-type="doi">10.1016/j.future.2017.01.003</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Marinho</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Murta</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Werner</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Braganholo</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Cruz</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Ogasawara</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Mattoso</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>ProvManager: a provenance management system for scientific workflows</article-title>
          <source>Concurr Comput</source>
          <year>2012</year>
          <volume>24</volume>
          <issue>13</issue>
          <fpage>1513</fpage>
          <lpage>30</lpage>
          <pub-id pub-id-type="doi">10.1002/cpe.1870</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bowers</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>McPhillips</surname>
              <given-names>TM</given-names>
            </name>
            <name name-style="western">
              <surname>Ludäscher</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Provenance in collection‐oriented scientific workflows</article-title>
          <source>Concurr Comput</source>
          <year>2008</year>
          <volume>20</volume>
          <issue>5</issue>
          <fpage>519</fpage>
          <lpage>29</lpage>
          <pub-id pub-id-type="doi">10.1002/cpe.1226</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Can</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Yilmazer</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>A novel approach to provenance management for privacy preservation</article-title>
          <source>J Inf Sci</source>
          <year>2020</year>
          <volume>46</volume>
          <issue>2</issue>
          <fpage>147</fpage>
          <lpage>60</lpage>
          <pub-id pub-id-type="doi">10.1177/0165551519827882</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Curcin</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Fairweather</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Danger</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Corrigan</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Templates as a method for implementing data provenance in decision support systems</article-title>
          <source>J Biomed Inform</source>
          <year>2017</year>
          <month>01</month>
          <volume>65</volume>
          <fpage>1</fpage>
          <lpage>21</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(16)30159-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2016.10.022</pub-id>
          <pub-id pub-id-type="medline">27856379</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(16)30159-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Khan</surname>
              <given-names>FZ</given-names>
            </name>
            <name name-style="western">
              <surname>Soiland-Reyes</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sinnott</surname>
              <given-names>RO</given-names>
            </name>
            <name name-style="western">
              <surname>Lonie</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Goble</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Crusoe</surname>
              <given-names>MR</given-names>
            </name>
          </person-group>
          <article-title>Sharing interoperable workflow provenance: a review of best practices and their practical application in CWLProv</article-title>
          <source>Gigascience</source>
          <year>2019</year>
          <month>11</month>
          <day>01</day>
          <volume>8</volume>
          <issue>11</issue>
          <fpage>giz095</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31675414"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/gigascience/giz095</pub-id>
          <pub-id pub-id-type="medline">31675414</pub-id>
          <pub-id pub-id-type="pii">5611001</pub-id>
          <pub-id pub-id-type="pmcid">PMC6824458</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ciccarese</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Soiland-Reyes</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Belhajjame</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Gray</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Goble</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Clark</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>PAV ontology: provenance, authoring and versioning</article-title>
          <source>J Biomed Semantics</source>
          <year>2013</year>
          <month>11</month>
          <day>22</day>
          <volume>4</volume>
          <issue>1</issue>
          <fpage>37</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://jbiomedsem.biomedcentral.com/articles/10.1186/2041-1480-4-37"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/2041-1480-4-37</pub-id>
          <pub-id pub-id-type="medline">24267948</pub-id>
          <pub-id pub-id-type="pii">2041-1480-4-37</pub-id>
          <pub-id pub-id-type="pmcid">PMC4177195</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Alterovitz</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Dean</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Goble</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Crusoe</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Soiland-Reyes</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bell</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hayes</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Suresh</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Purkayastha</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>King</surname>
              <given-names>CH</given-names>
            </name>
            <name name-style="western">
              <surname>Taylor</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Johanson</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Thompson</surname>
              <given-names>EE</given-names>
            </name>
            <name name-style="western">
              <surname>Donaldson</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Morizono</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Tsang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Vora</surname>
              <given-names>JK</given-names>
            </name>
            <name name-style="western">
              <surname>Goecks</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Yao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Almeida</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Keeney</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Addepalli</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Krampis</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>KM</given-names>
            </name>
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Walderhaug</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Schito</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ezewudo</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Guimera</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Walsh</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Kahsay</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Gottipati</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Rodwell</surname>
              <given-names>TC</given-names>
            </name>
            <name name-style="western">
              <surname>Bloom</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Lai</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Simonyan</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Mazumder</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Enabling precision medicine via standard communication of HTS provenance, analysis, and results</article-title>
          <source>PLoS Biol</source>
          <year>2018</year>
          <month>12</month>
          <day>31</day>
          <volume>16</volume>
          <issue>12</issue>
          <fpage>e3000099</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pbio.3000099"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pbio.3000099</pub-id>
          <pub-id pub-id-type="medline">30596645</pub-id>
          <pub-id pub-id-type="pii">PBIOLOGY-D-18-01024</pub-id>
          <pub-id pub-id-type="pmcid">PMC6338479</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref61">
        <label>61</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Arshad</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Munir</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>McClatchey</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Shamdasani</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Khan</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>NeuroProv: Provenance data visualisation for neuroimaging analyses</article-title>
          <source>J Comput Lang</source>
          <year>2019</year>
          <month>06</month>
          <volume>52</volume>
          <fpage>72</fpage>
          <lpage>87</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1016/j.cola.2019.04.004"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.cola.2019.04.004</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref62">
        <label>62</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stitz</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Luger</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Streit</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gehlenborg</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>AVOCADO: visualization of workflow-derived data provenance for reproducible biomedical research</article-title>
          <source>Comput Graph Forum</source>
          <year>2016</year>
          <month>06</month>
          <day>04</day>
          <volume>35</volume>
          <issue>3</issue>
          <fpage>481</fpage>
          <lpage>90</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/29973745"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/cgf.12924</pub-id>
          <pub-id pub-id-type="medline">29973745</pub-id>
          <pub-id pub-id-type="pmcid">PMC6027754</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref63">
        <label>63</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sahoo</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Bodenreider</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Hitzler</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Sheth</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Thirunarayan</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Provenance context entity (PaCE): scalable provenance tracking for scientific RDF data</article-title>
          <source>Proceedings of the 22nd International Conference on Scientific and Statistical Database Management</source>
          <year>2010</year>
          <conf-name>SSDBM '10</conf-name>
          <conf-date>June 30-July 2, 2010</conf-date>
          <conf-loc>Heidelberg, Germany</conf-loc>
          <fpage>461</fpage>
          <lpage>70</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://link.springer.com/chapter/10.1007/978-3-642-13818-8_32"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/978-3-642-13818-8_32</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref64">
        <label>64</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>McClatchey</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Branson</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Anjum</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bloodsworth</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Habib</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Munir</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Shamdasani</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Soomro</surname>
              <given-names>K</given-names>
            </name>
            <collab>neuGRID Consortium</collab>
          </person-group>
          <article-title>Providing traceability for neuroimaging analyses</article-title>
          <source>Int J Med Inform</source>
          <year>2013</year>
          <month>09</month>
          <volume>82</volume>
          <issue>9</issue>
          <fpage>882</fpage>
          <lpage>94</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2013.05.005</pub-id>
          <pub-id pub-id-type="medline">23763909</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(13)00111-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref65">
        <label>65</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Monnin</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Legrand</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Husson</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Ringot</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Tchechmedjiev</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Jonquet</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Napoli</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Coulet</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>PGxO and PGxLOD: a reconciliation of pharmacogenomic knowledge of various provenances, enabling further comparison</article-title>
          <source>BMC Bioinformatics</source>
          <year>2019</year>
          <month>04</month>
          <day>18</day>
          <volume>20</volume>
          <issue>Suppl 4</issue>
          <fpage>139</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcbioinformatics.biomedcentral.com/articles/10.1186/s12859-019-2693-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12859-019-2693-9</pub-id>
          <pub-id pub-id-type="medline">30999867</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12859-019-2693-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC6471679</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref66">
        <label>66</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ornelas</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Braga</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>David</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Campos</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Castro</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Provenance data discovery through semantic web resources</article-title>
          <source>Concurr Comput</source>
          <year>2018</year>
          <volume>30</volume>
          <issue>6</issue>
          <fpage>e4366</fpage>
          <pub-id pub-id-type="doi">10.1002/cpe.4366</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref67">
        <label>67</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Madougou</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Shahand</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Santcroos</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>van Schaik</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Benabdelkader</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>van Kampen</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Olabarriaga</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Characterizing workflow-based activity on a production e-infrastructure using provenance data</article-title>
          <source>Future Gener Comput Syst</source>
          <year>2013</year>
          <month>10</month>
          <volume>29</volume>
          <issue>8</issue>
          <fpage>1931</fpage>
          <lpage>42</lpage>
          <pub-id pub-id-type="doi">10.1016/j.future.2013.04.019</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref68">
        <label>68</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lim</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chebotko</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Fotouhi</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Storing, reasoning, and querying OPM-compliant scientific workflow provenance using relational databases</article-title>
          <source>Future Gener Comput Syst</source>
          <year>2011</year>
          <month>6</month>
          <volume>27</volume>
          <issue>6</issue>
          <fpage>781</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1016/j.future.2010.10.013</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref69">
        <label>69</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jennath</surname>
              <given-names>HS</given-names>
            </name>
            <name name-style="western">
              <surname>Anoop</surname>
              <given-names>VS</given-names>
            </name>
            <name name-style="western">
              <surname>Asharaf</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Blockchain for healthcare: securing patient data and enabling trusted artificial intelligence</article-title>
          <source>Int J Interact Multimed Artif Intell</source>
          <year>2020</year>
          <volume>6</volume>
          <issue>3</issue>
          <fpage>15</fpage>
          <pub-id pub-id-type="doi">10.9781/ijimai.2020.07.002</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref70">
        <label>70</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Pizarro</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Tong</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zoltick</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Weinberger</surname>
              <given-names>DR</given-names>
            </name>
            <name name-style="western">
              <surname>Mattay</surname>
              <given-names>VS</given-names>
            </name>
          </person-group>
          <article-title>Bio-swarm-pipeline: a light-weight, extensible batch processing system for efficient biomedical data processing</article-title>
          <source>Front Neuroinform</source>
          <year>2009</year>
          <volume>3</volume>
          <fpage>35</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/19847314"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/neuro.11.035.2009</pub-id>
          <pub-id pub-id-type="medline">19847314</pub-id>
          <pub-id pub-id-type="pmcid">PMC2763889</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref71">
        <label>71</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jabal</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Bertino</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>A comprehensive query language for provenance information</article-title>
          <source>Int J Coop Info Syst</source>
          <year>2018</year>
          <month>09</month>
          <day>26</day>
          <volume>27</volume>
          <issue>03</issue>
          <fpage>1850007</fpage>
          <pub-id pub-id-type="doi">10.1142/S0218843018500077</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref72">
        <label>72</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Deelman</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Gil</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Mehta</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Ratnakar</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Provenance trails in the Wings/Pegasus system</article-title>
          <source>Concurr Comput</source>
          <year>2008</year>
          <volume>20</volume>
          <issue>5</issue>
          <fpage>587</fpage>
          <lpage>97</lpage>
          <pub-id pub-id-type="doi">10.1002/cpe.1228</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref73">
        <label>73</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lim</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chebotko</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Fotouhi</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Kashlev</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>OPQL: querying scientific workflow provenance at the graph level</article-title>
          <source>Data Knowl Eng</source>
          <year>2013</year>
          <month>11</month>
          <volume>88</volume>
          <fpage>37</fpage>
          <lpage>59</lpage>
          <pub-id pub-id-type="doi">10.1016/j.datak.2013.08.008</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref74">
        <label>74</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wittner</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Mascia</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Gallo</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Frexia</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Müller</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Plass</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Geiger</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Holub</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Lightweight distributed provenance model for complex real-world environments</article-title>
          <source>Sci Data</source>
          <year>2022</year>
          <month>08</month>
          <day>17</day>
          <volume>9</volume>
          <issue>1</issue>
          <fpage>503</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41597-022-01537-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41597-022-01537-6</pub-id>
          <pub-id pub-id-type="medline">35977957</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41597-022-01537-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC9383664</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref75">
        <label>75</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Samuel</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>König-Ries</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>A collaborative semantic-based provenance management platform for reproducibility</article-title>
          <source>PeerJ Comput Sci</source>
          <year>2022</year>
          <volume>8</volume>
          <fpage>e921</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35494870"/>
          </comment>
          <pub-id pub-id-type="doi">10.7717/peerj-cs.921</pub-id>
          <pub-id pub-id-type="medline">35494870</pub-id>
          <pub-id pub-id-type="pii">cs-921</pub-id>
          <pub-id pub-id-type="pmcid">PMC9044346</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref76">
        <label>76</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yazici</surname>
              <given-names>IM</given-names>
            </name>
            <name name-style="western">
              <surname>Aktas</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Yazici</surname>
              <given-names>IM</given-names>
            </name>
            <name name-style="western">
              <surname>Aktas</surname>
              <given-names>MS</given-names>
            </name>
          </person-group>
          <article-title>A novel visualization approach for data provenance</article-title>
          <source>Concurr Comput</source>
          <year>2022</year>
          <volume>34</volume>
          <issue>9</issue>
          <fpage>4</fpage>
          <lpage>12</lpage>
          <pub-id pub-id-type="doi">10.1002/cpe.6523</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref77">
        <label>77</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ross</surname>
              <given-names>PB</given-names>
            </name>
            <name name-style="western">
              <surname>Song</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tsao</surname>
              <given-names>PS</given-names>
            </name>
            <name name-style="western">
              <surname>Pan</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Trellis for efficient data and task management in the VA Million Veteran program</article-title>
          <source>Sci Rep</source>
          <year>2021</year>
          <month>12</month>
          <day>01</day>
          <volume>11</volume>
          <issue>1</issue>
          <fpage>23229</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-021-02569-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-021-02569-5</pub-id>
          <pub-id pub-id-type="medline">34853358</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-021-02569-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC8636485</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref78">
        <label>78</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nadendla</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Jackson</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Munro</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Quaglia</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Mészáros</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Olley</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Hobbs</surname>
              <given-names>ET</given-names>
            </name>
            <name name-style="western">
              <surname>Goralski</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Chibucos</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Mungall</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Tosatto</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Erill</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Giglio</surname>
              <given-names>MG</given-names>
            </name>
          </person-group>
          <article-title>ECO: the evidence and conclusion ontology, an update for 2022</article-title>
          <source>Nucleic Acids Res</source>
          <year>2022</year>
          <month>01</month>
          <day>07</day>
          <volume>50</volume>
          <issue>D1</issue>
          <fpage>D1515</fpage>
          <lpage>21</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34986598"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/nar/gkab1025</pub-id>
          <pub-id pub-id-type="medline">34986598</pub-id>
          <pub-id pub-id-type="pii">6431816</pub-id>
          <pub-id pub-id-type="pmcid">PMC8728134</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref79">
        <label>79</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Westbrook</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Varki</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Thomas</surname>
              <given-names>WK</given-names>
            </name>
          </person-group>
          <article-title>RepeatFS: a file system providing reproducibility through provenance and automation</article-title>
          <source>Bioinformatics</source>
          <year>2021</year>
          <month>06</month>
          <day>09</day>
          <volume>37</volume>
          <issue>9</issue>
          <fpage>1292</fpage>
          <lpage>6</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33230554"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/btaa950</pub-id>
          <pub-id pub-id-type="medline">33230554</pub-id>
          <pub-id pub-id-type="pii">5952659</pub-id>
          <pub-id pub-id-type="pmcid">PMC8189677</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref80">
        <label>80</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Raboudi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Allanic</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Balvay</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Hervé</surname>
              <given-names>PY</given-names>
            </name>
            <name name-style="western">
              <surname>Viel</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Yoganathan</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Certain</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hilbey</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Charlet</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Durupt</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Boutinaud</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Eynard</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Tavitian</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>The BMS-LM ontology for biomedical data reporting throughout the lifecycle of a research study: from data model to ontology</article-title>
          <source>J Biomed Inform</source>
          <year>2022</year>
          <month>03</month>
          <volume>127</volume>
          <fpage>104007</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(22)00023-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2022.104007</pub-id>
          <pub-id pub-id-type="medline">35124236</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(22)00023-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref81">
        <label>81</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Levinson</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Niestroy</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Al Manir</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Fairchild</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Lake</surname>
              <given-names>DE</given-names>
            </name>
            <name name-style="western">
              <surname>Moorman</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Clark</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>FAIRSCAPE: a framework for FAIR and reproducible biomedical analytics</article-title>
          <source>Neuroinformatics</source>
          <year>2021</year>
          <volume>20</volume>
          <issue>1</issue>
          <fpage>187</fpage>
          <lpage>202</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34264488"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s12021-021-09529-4</pub-id>
          <pub-id pub-id-type="medline">34264488</pub-id>
          <pub-id pub-id-type="pii">10.1007/s12021-021-09529-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC8760356</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref82">
        <label>82</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wagner</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Waite</surname>
              <given-names>LK</given-names>
            </name>
            <name name-style="western">
              <surname>Wierzba</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hoffstaedter</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Waite</surname>
              <given-names>AQ</given-names>
            </name>
            <name name-style="western">
              <surname>Poldrack</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Eickhoff</surname>
              <given-names>SB</given-names>
            </name>
            <name name-style="western">
              <surname>Hanke</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>FAIRly big: a framework for computationally reproducible processing of large-scale data</article-title>
          <source>Sci Data</source>
          <year>2022</year>
          <month>03</month>
          <day>11</day>
          <volume>9</volume>
          <issue>1</issue>
          <fpage>80</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41597-022-01163-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41597-022-01163-2</pub-id>
          <pub-id pub-id-type="medline">35277501</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41597-022-01163-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC8917149</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref83">
        <label>83</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mitchell</surname>
              <given-names>SN</given-names>
            </name>
            <name name-style="western">
              <surname>Lahiff</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cummings</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Hollocombe</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Boskamp</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Field</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Reddyhoff</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Zarebski</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Wilson</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Viola</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Burke</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Archibald</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Bessell</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Blackwell</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Boden</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Brett</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Brett</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Dundas</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Enright</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Gonzalez-Beltran</surname>
              <given-names>AN</given-names>
            </name>
            <name name-style="western">
              <surname>Harris</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hinder</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>David Hughes</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Knight</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Mano</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>McMonagle</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Mellor</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Mohr</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Marion</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Matthews</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>McKendrick</surname>
              <given-names>IJ</given-names>
            </name>
            <name name-style="western">
              <surname>Mark Pooley</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Porphyre</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Reeves</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Townsend</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Turner</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Walton</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Reeve</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>FAIR data pipeline: provenance-driven data management for traceable scientific workflows</article-title>
          <source>Philos Trans A Math Phys Eng Sci</source>
          <year>2022</year>
          <month>10</month>
          <day>03</day>
          <volume>380</volume>
          <issue>2233</issue>
          <fpage>20210300</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://royalsocietypublishing.org/doi/abs/10.1098/rsta.2021.0300?url_ver=Z39.88-2003&#38;rfr_id=ori:rid:crossref.org&#38;rfr_dat=cr_pub  0pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1098/rsta.2021.0300</pub-id>
          <pub-id pub-id-type="medline">35965468</pub-id>
          <pub-id pub-id-type="pmcid">PMC9376726</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref84">
        <label>84</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Ambite</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Appaji</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lander</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Moore</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Rajasekar</surname>
              <given-names>AK</given-names>
            </name>
            <name name-style="western">
              <surname>Turner</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Turner</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Sahoo</surname>
              <given-names>SS</given-names>
            </name>
          </person-group>
          <article-title>Enabling scientific reproducibility through FAIR data management: an ontology-driven deep learning approach in the NeuroBridge project</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2022</year>
          <volume>2022</volume>
          <fpage>1135</fpage>
          <lpage>44</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37128458"/>
          </comment>
          <pub-id pub-id-type="medline">37128458</pub-id>
          <pub-id pub-id-type="pii">1165</pub-id>
          <pub-id pub-id-type="pmcid">PMC10148274</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref85">
        <label>85</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ruiz-Olazar</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Rocha</surname>
              <given-names>ES</given-names>
            </name>
            <name name-style="western">
              <surname>Vargas</surname>
              <given-names>CD</given-names>
            </name>
            <name name-style="western">
              <surname>Braghetto</surname>
              <given-names>KR</given-names>
            </name>
          </person-group>
          <article-title>The neuroscience experiments system (NES)-a software tool to manage experimental data and its provenance</article-title>
          <source>Front Neuroinform</source>
          <year>2021</year>
          <month>1</month>
          <day>7</day>
          <volume>15</volume>
          <fpage>768615</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35069167"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fninf.2021.768615</pub-id>
          <pub-id pub-id-type="medline">35069167</pub-id>
          <pub-id pub-id-type="pmcid">PMC8777234</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref86">
        <label>86</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Moreau</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Freire</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Futrelle</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>McGrath</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Myers</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Paulson</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>The open provenance model: an overview</article-title>
          <source>Proceedings of the 2nd International Provenance and Annotation Workshop on Provenance and Annotation of Data and Processes</source>
          <year>2008</year>
          <conf-name>IPAW '08</conf-name>
          <conf-date>June 17-18, 2008</conf-date>
          <conf-loc>Salt Lake City, UT</conf-loc>
          <fpage>323</fpage>
          <lpage>6</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://link.springer.com/chapter/10.1007/978-3-540-89965-5_31"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/978-3-540-89965-5_31</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref87">
        <label>87</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Morrison</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Moye</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Pandita</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Mapping the field of software life cycle security metrics</article-title>
          <source>Inf Softw Technol</source>
          <year>2018</year>
          <month>10</month>
          <volume>102</volume>
          <fpage>146</fpage>
          <lpage>59</lpage>
          <pub-id pub-id-type="doi">10.1016/j.infsof.2018.05.011</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref88">
        <label>88</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gierend</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Freiesleben</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kadioglu</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Siegel</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Ganslandt</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Waltemath</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>The status of data management practices across German medical data integration centers: mixed methods study</article-title>
          <source>J Med Internet Res</source>
          <year>2023</year>
          <month>11</month>
          <day>08</day>
          <volume>25</volume>
          <fpage>e48809</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2023//e48809/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/48809</pub-id>
          <pub-id pub-id-type="medline">37938878</pub-id>
          <pub-id pub-id-type="pii">v25i1e48809</pub-id>
          <pub-id pub-id-type="pmcid">PMC10666010</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref89">
        <label>89</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wing</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>The data life cycle</article-title>
          <source>Harv Data Sci Rev</source>
          <year>2019</year>
          <month>06</month>
          <day>23</day>
          <issue>1.1</issue>
          <fpage>1</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.1162/99608f92.e26845b4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref90">
        <label>90</label>
        <nlm-citation citation-type="web">
          <article-title>ISO 8000-2:2022 data quality</article-title>
          <source>International Organization for Standardization</source>
          <access-date>2022-12-13</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.iso.org/standard/85032.html">https://www.iso.org/standard/85032.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref91">
        <label>91</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gierend</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Wodke</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Genehr</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Gött</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Henkel</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Krüger</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Mandalka</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Michaelis</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Scheuerlein</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Schröder</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Zeleke</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Waltemath</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>TAPP: defining standard provenance information for clinical research data and workflows - obstacles and opportunities</article-title>
          <source>Proceedings of the 2023 ACM Web Conference</source>
          <year>2023</year>
          <conf-name>WWW '23</conf-name>
          <conf-date>April 30-May 1, 2023</conf-date>
          <conf-loc>Austin, TX</conf-loc>
          <fpage>1551</fpage>
          <lpage>4</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/10.1145/3543873.3587562"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/3543873.3587562</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref92">
        <label>92</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sembay</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>de Macedo</surname>
              <given-names>DD</given-names>
            </name>
            <name name-style="western">
              <surname>Júnior</surname>
              <given-names>LP</given-names>
            </name>
            <name name-style="western">
              <surname>Braga</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Sarasa-Cabezuelo</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Provenance data management in health information systems: a systematic literature review</article-title>
          <source>J Pers Med</source>
          <year>2023</year>
          <month>06</month>
          <day>13</day>
          <volume>13</volume>
          <issue>6</issue>
          <fpage>991</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=jpm13060991"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/jpm13060991</pub-id>
          <pub-id pub-id-type="medline">37373980</pub-id>
          <pub-id pub-id-type="pii">jpm13060991</pub-id>
          <pub-id pub-id-type="pmcid">PMC10303902</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref93">
        <label>93</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kitchenham</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Charters</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Guidelines for performing systematic literature reviews in software engineering</article-title>
          <source>School of Computer Science and Mathematics</source>
          <year>2007</year>
          <access-date>2024-04-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://legacyfileshare.elsevier.com/promis_misc/525444systematicreviewsguide.pdf">https://legacyfileshare.elsevier.com/promis_misc/525444systematicreviewsguide.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref94">
        <label>94</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ahmed</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dar</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>Helfert</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Khan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Data provenance in healthcare: approaches, challenges, and future directions</article-title>
          <source>Sensors (Basel)</source>
          <year>2023</year>
          <month>07</month>
          <day>18</day>
          <volume>23</volume>
          <issue>14</issue>
          <fpage>6495</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=s23146495"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/s23146495</pub-id>
          <pub-id pub-id-type="medline">37514788</pub-id>
          <pub-id pub-id-type="pii">s23146495</pub-id>
          <pub-id pub-id-type="pmcid">PMC10384601</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref95">
        <label>95</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Johns</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Meurers</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Wirth</surname>
              <given-names>FN</given-names>
            </name>
            <name name-style="western">
              <surname>Haber</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Müller</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Halilovic</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Balzer</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Prasser</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Data provenance in biomedical research: scoping review</article-title>
          <source>J Med Internet Res</source>
          <year>2023</year>
          <month>03</month>
          <day>27</day>
          <volume>25</volume>
          <fpage>e42289</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2023//e42289/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/42289</pub-id>
          <pub-id pub-id-type="medline">36972116</pub-id>
          <pub-id pub-id-type="pii">v25i1e42289</pub-id>
          <pub-id pub-id-type="pmcid">PMC10132013</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
