<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v28i1e83369</article-id>
      <article-id pub-id-type="pmid">42054696</article-id>
      <article-id pub-id-type="doi">10.2196/83369</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Viewpoint</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Viewpoint</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Rethinking Trust in Synthetic Health Data: Lessons From 7 European Research Initiatives</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Mavragani</surname>
            <given-names>Amaryllis</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Liu</surname>
            <given-names>Dan</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Deschepper</surname>
            <given-names>Mieke</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Busatta</surname>
            <given-names>Lucia</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Jackson</surname>
            <given-names>Nicholas</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Hashemi</surname>
            <given-names>Atiye</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Declerck</surname>
            <given-names>Jens</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff01" ref-type="aff">1</xref>
          <address>
            <institution>The European Institute for Innovation through Health Data</institution>
            <addr-line>Merebaaistraat 10</addr-line>
            <addr-line>Oosterzele, 9860</addr-line>
            <country>Belgium</country>
            <phone>32 0474538199</phone>
            <email>jens.declerck@i-hd.eu</email>
          </address>
          <xref rid="aff02" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9743-9188</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Kalra</surname>
            <given-names>Dipak</given-names>
          </name>
          <degrees>Prof Dr</degrees>
          <xref rid="aff01" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2998-9882</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Airola</surname>
            <given-names>Antti</given-names>
          </name>
          <xref rid="aff03" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-1010-4386</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Amer</surname>
            <given-names>Ahmed Youssef Ali</given-names>
          </name>
          <xref rid="aff04" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5347-9009</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Chatzichristos</surname>
            <given-names>Christos</given-names>
          </name>
          <xref rid="aff05" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9054-5340</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>del Mar Mañu Pereira</surname>
            <given-names>Maria</given-names>
          </name>
          <xref rid="aff06" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4770-7460</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>M. de Brito Robalo</surname>
            <given-names>Bruno</given-names>
          </name>
          <xref rid="aff07" ref-type="aff">7</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9957-5039</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Ghini</surname>
            <given-names>Francesco</given-names>
          </name>
          <xref rid="aff08" ref-type="aff">8</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6746-4542</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author">
          <name name-style="western">
            <surname>Gutierrez-Torre</surname>
            <given-names>Alberto</given-names>
          </name>
          <xref rid="aff09" ref-type="aff">9</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5548-3359</ext-link>
        </contrib>
        <contrib id="contrib10" contrib-type="author">
          <name name-style="western">
            <surname>Hoogteijling</surname>
            <given-names>Sem</given-names>
          </name>
          <xref rid="aff10" ref-type="aff">10</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-4455-6700</ext-link>
        </contrib>
        <contrib id="contrib11" contrib-type="author">
          <name name-style="western">
            <surname>Hultsch</surname>
            <given-names>Susanne</given-names>
          </name>
          <xref rid="aff11" ref-type="aff">11</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6739-1665</ext-link>
        </contrib>
        <contrib id="contrib12" contrib-type="author">
          <name name-style="western">
            <surname>Ramon</surname>
            <given-names>Jan</given-names>
          </name>
          <xref rid="aff12" ref-type="aff">12</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0558-7176</ext-link>
        </contrib>
        <contrib id="contrib13" contrib-type="author">
          <name name-style="western">
            <surname>Reidel</surname>
            <given-names>Sara</given-names>
          </name>
          <xref rid="aff13" ref-type="aff">13</xref>
          <xref rid="aff14" ref-type="aff">14</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1887-9538</ext-link>
        </contrib>
        <contrib id="contrib14" contrib-type="author">
          <name name-style="western">
            <surname>Regazzoni</surname>
            <given-names>Francesco</given-names>
          </name>
          <xref rid="aff15" ref-type="aff">15</xref>
          <xref rid="aff16" ref-type="aff">16</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6385-0780</ext-link>
        </contrib>
        <contrib id="contrib15" contrib-type="author">
          <name name-style="western">
            <surname>Silva</surname>
            <given-names>Luís</given-names>
          </name>
          <xref rid="aff17" ref-type="aff">17</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9811-0571</ext-link>
        </contrib>
        <contrib id="contrib16" contrib-type="author">
          <name name-style="western">
            <surname>Silveira</surname>
            <given-names>Inês</given-names>
          </name>
          <xref rid="aff17" ref-type="aff">17</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0675-3444</ext-link>
        </contrib>
        <contrib id="contrib17" contrib-type="author">
          <name name-style="western">
            <surname>Sofia</surname>
            <given-names>Tsekeridou</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff18" ref-type="aff">18</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-3830-1936</ext-link>
        </contrib>
        <contrib id="contrib18" contrib-type="author">
          <name name-style="western">
            <surname>Maes</surname>
            <given-names>Christophe</given-names>
          </name>
          <xref rid="aff01" ref-type="aff">1</xref>
          <xref rid="aff02" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0007-7114-0675</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff01">
        <label>1</label>
        <institution>The European Institute for Innovation through Health Data</institution>
        <addr-line>Oosterzele</addr-line>
        <country>Belgium</country>
      </aff>
      <aff id="aff02">
        <label>2</label>
        <institution>Unit of Medical Informatics and Statistics</institution>
        <institution>Department of Public Health and Primary Care</institution>
        <institution>The University of Ghent</institution>
        <addr-line>Ghent</addr-line>
        <country>Belgium</country>
      </aff>
      <aff id="aff03">
        <label>3</label>
        <institution>Department of Computing</institution>
        <institution>University of Turku</institution>
        <addr-line>Turku</addr-line>
        <country>Finland</country>
      </aff>
      <aff id="aff04">
        <label>4</label>
        <institution>Innovative Medicine</institution>
        <institution>Johnson &#38; Johnson</institution>
        <addr-line>Beerse</addr-line>
        <country>Belgium</country>
      </aff>
      <aff id="aff05">
        <label>5</label>
        <institution>Department of Electrical Engineering</institution>
        <institution>KU Leuven</institution>
        <addr-line>Leuven</addr-line>
        <country>Belgium</country>
      </aff>
      <aff id="aff06">
        <label>6</label>
        <institution>University Hospital Vall d'Hebron</institution>
        <addr-line>Barcelona</addr-line>
        <country>Spain</country>
      </aff>
      <aff id="aff07">
        <label>7</label>
        <institution>Department of Obstetrics and Gynaecology</institution>
        <institution>Erasmus MC</institution>
        <institution>University Medical Center</institution>
        <addr-line>Rotterdam</addr-line>
        <country>The Netherlands</country>
      </aff>
      <aff id="aff08">
        <label>8</label>
        <institution>Laboratory of Translational Research</institution>
        <addr-line>Reggio Emilia</addr-line>
        <country>Italy</country>
      </aff>
      <aff id="aff09">
        <label>9</label>
        <institution>Barcelona Supercomputing Center</institution>
        <addr-line>Barcelona, Catalonia</addr-line>
        <country>Spain</country>
      </aff>
      <aff id="aff10">
        <label>10</label>
        <institution>Department of Neurology and Neurosurgery</institution>
        <institution>University Medical Center Utrecht Brain Center</institution>
        <addr-line>Utrecht</addr-line>
        <country>The Netherlands</country>
      </aff>
      <aff id="aff11">
        <label>11</label>
        <institution>VEIL.AI</institution>
        <addr-line>Helsinki</addr-line>
        <country>Finland</country>
      </aff>
      <aff id="aff12">
        <label>12</label>
        <institution>Institut national de recherche en sciences et technologies du numérique</institution>
        <addr-line>Lille</addr-line>
        <country>France</country>
      </aff>
      <aff id="aff13">
        <label>13</label>
        <institution>Vall d'Hebron Research Institute</institution>
        <institution>University Hospital Vall d'Hebron</institution>
        <addr-line>Barcelona</addr-line>
        <country>Spain</country>
      </aff>
      <aff id="aff14">
        <label>14</label>
        <institution>BarcelonaTech (UPC)</institution>
        <institution>Universitat Politècnica de Catalunya</institution>
        <addr-line>Barcelona</addr-line>
        <country>Spain</country>
      </aff>
      <aff id="aff15">
        <label>15</label>
        <institution>University of Amsterdam</institution>
        <addr-line>Amsterdam</addr-line>
        <country>The Netherlands</country>
      </aff>
      <aff id="aff16">
        <label>16</label>
        <institution>Università della Svizzera italiana</institution>
        <addr-line>Lugano, Ticino</addr-line>
        <country>Switzerland</country>
      </aff>
      <aff id="aff17">
        <label>17</label>
        <institution>Laboratory for Instrumentation, Biomedical Engineering and Radiation Physics</institution>
        <institution>NOVA School of Science and Technology</institution>
        <addr-line>Caparica</addr-line>
        <country>Portugal</country>
      </aff>
      <aff id="aff18">
        <label>18</label>
        <institution>Netcompany BELUX</institution>
        <addr-line>Athens</addr-line>
        <country>Greece</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Jens Declerck <email>jens.declerck@i-hd.eu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2026</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>29</day>
        <month>4</month>
        <year>2026</year>
      </pub-date>
      <volume>28</volume>
      <elocation-id>e83369</elocation-id>
      <history>
        <date date-type="received">
          <day>1</day>
          <month>9</month>
          <year>2025</year>
        </date>
        <date date-type="rev-request">
          <day>29</day>
          <month>10</month>
          <year>2025</year>
        </date>
        <date date-type="rev-recd">
          <day>4</day>
          <month>3</month>
          <year>2026</year>
        </date>
        <date date-type="accepted">
          <day>24</day>
          <month>3</month>
          <year>2026</year>
        </date>
      </history>
      <copyright-statement>©Jens Declerck, Dipak Kalra, Antti Airola, Ahmed Youssef Ali Amer, Christos Chatzichristos, Maria del Mar Mañu Pereira, Bruno M. de Brito Robalo, Francesco Ghini, Alberto Gutierrez-Torre, Sem Hoogteijling, Susanne Hultsch, Jan Ramon, Sara Reidel, Francesco Regazzoni, Luís Silva, Inês Silveira, Tsekeridou Sofia, Christophe Maes. Originally published in the Journal of Medical Internet Research (https://www.jmir.org), 29.04.2026.</copyright-statement>
      <copyright-year>2026</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research (ISSN 1438-8871), is properly cited. The complete bibliographic information, a link to the original publication on https://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2026/1/e83369" xlink:type="simple"/>
      <abstract>
        <p>Synthetic data generation (SDG) structured health data is increasingly promoted as a solution to longstanding barriers in health data access. It is offering the promise of privacy-preserving data reuse for research, innovation, and policy. Despite rapid technical advances, the adoption of synthetic health data in real-world settings remains limited. Shaped by challenges around data quality, representativeness, infrastructure readiness, trust, and legal uncertainty, this viewpoint draws on experiences from 7 European research initiatives within the HealthData4EU cluster to reflect on how SDG is being operationalized in practice. It synthesizes cross-project insights to highlight recurring methodological and governance tensions and to examine their implications for trust and responsible use. The analysis argues that trustworthy SDG cannot be achieved through technical optimization alone but requires alignment between evaluation practices, upstream data stewardship, regulatory clarity, and sustained stakeholder engagement. Addressing these conditions is essential for moving synthetic data from experimental pilots toward a credible and sustainable component of European health research ecosystems.</p>
      </abstract>
      <kwd-group>
        <kwd>health data quality</kwd>
        <kwd>synthetic data generation</kwd>
        <kwd>health data</kwd>
        <kwd>data quality dimensions</kwd>
        <kwd>privacy</kwd>
        <kwd>project</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>As health care systems are largely digitized and become increasingly data-driven, access to large-scale, high-quality data is essential for clinical research [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref3">3</xref>], digital health innovation [<xref ref-type="bibr" rid="ref4">4</xref>], and evidence-based policymaking [<xref ref-type="bibr" rid="ref5">5</xref>]. However, accessing patient-level health data remains a persistent challenge [<xref ref-type="bibr" rid="ref6">6</xref>]. Privacy regulations [<xref ref-type="bibr" rid="ref7">7</xref>], data quality issues [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref9">9</xref>], and data fragmentation [<xref ref-type="bibr" rid="ref10">10</xref>] continue to limit data access and sharing, especially in cross-organizational studies [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref11">11</xref>]. These barriers not only slow innovation but also risk underrepresenting certain diseases and populations, such as rare conditions, in secondary data use. As a result, many promising analytical and clinical applications struggle to move beyond pilots.</p>
      <p>Synthetic data generation (SDG) has emerged as a promising response to the barriers limiting access and reuse of patient-level health data [<xref ref-type="bibr" rid="ref12">12</xref>]. By producing synthetic datasets that resemble the statistical and structural properties of real health data, without exposing personal identities, SDG can drive innovation while maintaining privacy [<xref ref-type="bibr" rid="ref7">7</xref>]. It enables safer collaboration across different types of health data (eg, electronic health records, genomics, medical imaging) and offers value in areas such as artificial intelligence (AI) development [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref13">13</xref>], rare disease research [<xref ref-type="bibr" rid="ref14">14</xref>], and model testing [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref15">15</xref>]. The main aim of SDG is to retain the essential characteristics of original datasets while retaining privacy (in most use cases). These can be grouped into quantitative [<xref ref-type="bibr" rid="ref16">16</xref>] (eg, statistical metrics, analytical patterns, signal-based features), qualitative [<xref ref-type="bibr" rid="ref16">16</xref>] (eg, expert-driven assessments), and domain-specific attributes [<xref ref-type="bibr" rid="ref17">17</xref>] that depend on the data type and specific use case. Conceptual work has also emphasized the importance of incorporating domain knowledge into SDG processes to improve realism and relevance for clinical applications [<xref ref-type="bibr" rid="ref18">18</xref>]. Despite this growing interest, the adoption of synthetic health data in real-world research and clinical environments remains limited [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref19">19</xref>]. Concerns persist regarding data quality, representativeness, interpretability, and legal status [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref21">21</xref>], as well as the uncertainty about how synthetic data exceed what current methods and data infrastructures can deliver [<xref ref-type="bibr" rid="ref13">13</xref>]. This gap between promise and practice has contributed to skepticism among multiple stakeholders, for whom trust in data sources is essential [<xref ref-type="bibr" rid="ref22">22</xref>]. This lack of trust is partly explained by the focus of SDG literature on technical methods and evaluation metrics [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref23">23</xref>] while giving limited attention to the organizational, legal, and sociotechnical conditions that shape real-world adoption [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref22">22</xref>].</p>
      <p>Several EU-funded initiatives are currently testing SDG in real-world health research settings, all facing a shared question: how can synthetic health data be made trustworthy, useful, and safe? Despite this activity, there has been limited cross-initiative reflection on how these challenges are being addressed in practice.</p>
      <p>The aim of this viewpoint is to examine why trust in synthetic health data remains fragile despite growing technical maturity and to reflect on the nontechnical conditions required for its responsible adoption. This article is intended for health data researchers, clinicians, data stewards, infrastructure developers, regulators, and policymakers engaged in secondary use of health data across Europe. This article provides a viewpoint informed by experiences from 7 European research initiatives within the HealthData4Eu cluster that work with structured synthetic health data. It synthesizes cross-project insights to highlight recurring challenges related to data quality, interoperability, regulatory alignment, and stakeholder acceptance and reflects on their implications for trust, governance, and responsible use of synthetic data in European health research.</p>
      <sec>
        <title>Basis of This Viewpoint</title>
        <sec>
          <title>Scope and Context of the Included Projects</title>
          <p>This viewpoint is informed by 7 EU-funded projects that constitute the HealthData4EU cluster, a Horizon Europe initiative focused on advancing SDG and secure data use in health research across Europe. Collectively, these projects address complementary aspects of the synthetic data landscape, including data generation methods, federated and privacy-preserving architectures, secure data sharing, and AI-enabled clinical applications. All operate within a shared European policy and funding framework while engaging with diverse clinical and institutional contexts relevant to the European Health Data Space.</p>
          <p>The included initiatives represent the full set of synthetic data projects participating in the HealthData4EU cluster at the time of writing. While they operate within a shared European policy and funding framework, they span a wide range of clinical domains, data modalities (eg, tabular, imaging, longitudinal, multimodal data), and technical approaches. This diversity within a coordinated structure provides a useful basis for reflecting on how SDG is being operationalized across health care settings and where common challenges and tensions emerge. An overview of the participating initiatives with their clinical domains is provided in <xref ref-type="table" rid="table1">Table 1</xref>.</p>
          <table-wrap position="float" id="table1">
            <label>Table 1</label>
            <caption>
              <p>Overview of projects, clinical domains, and example use cases involving synthetic data.</p>
            </caption>
            <table border="1" rules="groups" cellpadding="5" frame="hsides" width="1000" cellspacing="0">
              <col width="150"/>
              <col width="370"/>
              <col width="480"/>
              <thead>
                <tr valign="top">
                  <td>Project</td>
                  <td>Clinical domain(s)</td>
                  <td>Example use cases</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>AISym4MED</td>
                  <td>Neurological and chronic diseases (ie, diffuse large B-cell lymphoma, lung cancer, multiple myeloma, Alzheimer disease, type 2 diabetes, breast cancer)</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>Synthetic data for multimodal applications</p>
                      </list-item>
                      <list-item>
                        <p>Support for AI<sup>a</sup> model testing</p>
                      </list-item>
                    </list>
                  </td>
                </tr>
                <tr valign="top">
                  <td>FLUTE</td>
                  <td>Oncology (prostate cancer)</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>Risk stratification</p>
                      </list-item>
                      <list-item>
                        <p>Federated AI validation for prostate cancer diagnosis</p>
                      </list-item>
                    </list>
                  </td>
                </tr>
                <tr valign="top">
                  <td>PHASE IV AI</td>
                  <td>Oncology and neurology (ie, lung cancer, prostate cancer, ischemic stroke)</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>Early lung cancer detection</p>
                      </list-item>
                      <list-item>
                        <p>Synthetic magnetic resonance imaging for stroke and model testing</p>
                      </list-item>
                    </list>
                  </td>
                </tr>
                <tr valign="top">
                  <td>PHEMS</td>
                  <td>Pediatric diseases (ie, congenital cardiac conditions, sepsis, hemophilia)</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>Sepsis prediction in pediatric intensive care units</p>
                      </list-item>
                      <list-item>
                        <p>Hemophilia care optimization</p>
                      </list-item>
                    </list>
                  </td>
                </tr>
                <tr valign="top">
                  <td>SECURED</td>
                  <td>Multiple domains (i.e.ie, mammography, histopathology, chest radiography, cardiotocography)</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>Privacy-preserving SDG<sup>b</sup></p>
                      </list-item>
                      <list-item>
                        <p>Federated AI tool development</p>
                      </list-item>
                    </list>
                  </td>
                </tr>
                <tr valign="top">
                  <td>SYNTHEMA</td>
                  <td>Rare hematological diseases (ie, sickle-cell disease, acute myeloid leukemia)</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>Synthetic datasets for rare disease research</p>
                      </list-item>
                      <list-item>
                        <p>Federated validation</p>
                      </list-item>
                    </list>
                  </td>
                </tr>
                <tr valign="top">
                  <td>SYNTHIA</td>
                  <td>Multimodal and personalized medicine</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>Benchmarking and validation of SDG methods across diverse clinical scenarios</p>
                      </list-item>
                    </list>
                  </td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table1fn1">
                <p><sup>a</sup>AI: artificial intelligence.</p>
              </fn>
              <fn id="table1fn2">
                <p><sup>b</sup>SDG: synthetic data generation.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
          <p>The insights synthesized in this paper draw on cross-project engagement conducted during the active lifetime of the initiatives. These insights were informed by cluster-level workshops, project presentations, and recurring exchanges among project teams and by review of the project documentation during the active implementation phase. Importantly, these interactions took place while projects were still ongoing, allowing challenges and emerging practices to be discussed as they arose rather than retrospectively. The exchanges involved multidisciplinary contributors, including technical developers, clinicians, data stewards, infrastructure providers, and legal and ethical experts.</p>
          <p>While these insights are not derived form a formal empirical study, they reflect sustained, longitudinal engagement with projects that are actively developing and validating the real-world use of synthetic health data within regulated clinical and research environments. To improve transparency and address requests for additional project-level context, we have incorporated a table in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> providing a descriptive overview of the included projects.</p>
        </sec>
      </sec>
      <sec>
        <title>Lessons From 7 SDG Projects</title>
        <sec>
          <title>A Shared Landscape of Methodological Tensions</title>
          <p>Across projects, SDG is not pursued as a single technical task but as a complex sociotechnical intervention embedded in heterogeneous health systems [<xref ref-type="bibr" rid="ref22">22</xref>]. In practice, SDG sits at the intersection of machine learning, clinical data infrastructures, regulatory governance, and institutional trust.</p>
          <p>Despite differences in disease focus, data modalities, and maturity, projects consistently encounter several recurring challenges that shape how SDG is operationalized in practice. Across the initiatives examined in this paper, 3 themes emerged repeatedly: the absence of shared consensus on how synthetic data quality should be defined and evaluated, the limitations of existing data infrastructures to support reliable SDG workflows, and uncertainty surrounding the regulatory and governance status of synthetic data. These challenges reflect the structural characteristics of health data ecosystems, where technical innovation must coexist with legal safeguards, clinical accountability, and fragmented infrastructures. Understanding SDG through these challenges helps explain why synthetic data adoption remains difficult to scale beyond pilot environments.</p>
        </sec>
        <sec>
          <title>Data Quality Without Consensus</title>
          <p>A central tension concerns how “data quality” in synthetic health data is defined and demonstrated. In practice, data quality is assessed through overlapping but fragmented lenses: statistical fidelity, analytical or clinical utility, and privacy protection. These dimensions are widely acknowledged across initiatives, yet there is no shared understanding of how they should be balanced, prioritized, or interpreted in different contexts [<xref ref-type="bibr" rid="ref24">24</xref>].</p>
          <p>Existing tools and metrics often assume that real-world source data are themselves unbiased, complete, and representative [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref9">9</xref>]. This assumption is rarely valid in health systems shaped by structural inequities, fragmented data capture, and variable clinical practices across institutions and regions. When real data reflect structural inequities or incomplete capture, synthetic data derived from them may inherit the same distortions [<xref ref-type="bibr" rid="ref20">20</xref>].</p>
          <p>As a result, SDG risks reinforcing existing biases rather than mitigating them. While synthetic data are frequently promoted as a mechanism for improving representativeness or enabling rare disease research, representational properties are frequently assessed primarily at the level of the resulting dataset [<xref ref-type="bibr" rid="ref6">6</xref>]. In practice, however, representativeness is shaped not only by the quality of the synthetic generation process but also by the characteristics of the underlying source data and the transformations applied during the data lifecycle (eg, data extraction, harmonization, mapping to common data models, other extraction transfer load steps) [<xref ref-type="bibr" rid="ref25">25</xref>]. These can introduce or amplify biases by selectively filtering variables, standardizing heterogeneous data sources, or excluding smaller subpopulations. These upstream influences may remain difficult to detect when evaluation focuses primarily on statistical similarity. As a result, population coverage and the potential impact of data preparation processes on representation may receive less attention in current evaluation practices.</p>
          <p>In this sense, data quality cannot be reduced to statistical resemblance alone. We argue that there is a need for a more explicit data quality assessment at source and across the data lifecycle. In that sense, results need to be interpreted in relation to the populations, decisions, and governance contexts in which synthetic data are intended to be used.</p>
        </sec>
        <sec>
          <title>Infrastructure as a Bottleneck to Trust</title>
          <p>Federated and decentralized SDG architectures are frequently presented as solutions to privacy and governance constraints [<xref ref-type="bibr" rid="ref13">13</xref>]. In practice, infrastructure maturity at data sources emerges as a critical limiting factor. Heterogeneous hospital IT systems, inconsistent data models, and uneven data governance practices complicate federated training and validation. These challenges affect not only technical integration but also the reliability of data inputs and the feasibility of data quality assessments.</p>
          <p>Interoperability challenges persist even when projects adopt common data models such as the Observational Medical Outcomes Partnership Common Data Model. Differences in local coding practices, laboratory workflows, and semantic interpretation (eg, variation in LOINC [Logical Observation Identifiers Names and Codes] mappings for similar laboratory measurements) require substantial upfront coordination. These nuances complicate federated validation and cross-site comparability, reinforcing that standardization alone does not eliminate heterogeneity in real-world health data. Within the HealthData4EU cluster, several projects reported that aligning local coding practices and laboratory mappings across institutions required substantial preprocessing effort before federated SDG or validation could be performed.</p>
          <p>These infrastructural constraints shape what forms of SDG are feasible and who can participate, reinforcing a gap between technical potential and institutional readiness.</p>
        </sec>
      </sec>
      <sec>
        <title>Trust, Transparency, and Regulatory Uncertainty</title>
        <sec>
          <title>Trust is Not Guaranteed by Compliance</title>
          <p>Most initiatives emphasize compliance with data protection and ethical frameworks. While compliance is necessary, it is not sufficient to generate trust. Trust emerges through transparency, interpretability, and meaningful stakeholder engagement across the SDG lifecycle [<xref ref-type="bibr" rid="ref22">22</xref>].</p>
          <p>In practice, these dimensions are unevenly operationalized. Some initiatives invest in dataset documentation, model cards, and participatory validation involving clinicians or data stewards. Others limit engagement to formal approval processes or internal review. This variability affects adoption, particularly in clinical and regulatory contexts where accountability and explainability are essential.</p>
          <p>In the European context, this includes emerging obligations under the EU Artificial Intelligence Act, specific for high-risk medical AI systems, where the provenance and validation of training data, including synthetic data, may become subject to increased scrutiny.</p>
        </sec>
        <sec>
          <title>The Unresolved Legal Status of Synthetic Data</title>
          <p>Regulatory ambiguity remains one of the most significant barriers to uptake. Synthetic data are often assumed to fall outside data protection regulation, yet institutions frequently adopt conservative interpretations, particularly of rare diseases or small cohorts [<xref ref-type="bibr" rid="ref26">26</xref>]. The absence of harmonized guidance leaves data controllers and ethics boards navigating uncertainty case by case.</p>
          <p>Clarification is particularly needed in relation to General Data Protection Regulation (GDPR) anonymization thresholds, the interaction with the EU Artificial Intelligence Act, and national interpretations by data protection authorities and ethics committees.</p>
          <p>This uncertainty raises a fundamental but often unspoken question: what is the value of synthetic data if it cannot be confidently reused beyond its original context? If synthetic datasets remain confined to local pilots due to legal or institutional caution, their potential to support cross-border research, reproducibility, and capacity building is limited. Addressing reusability therefore becomes central to the trust debate, linking legal clarity, documentation, and transparent validation of the broader promise of synthetic data as a shared research asset rather than a one-off technical item.</p>
        </sec>
        <sec>
          <title>Emerging Responses and Their Limits</title>
          <p>Encouragingly, initiatives are beginning to respond through federated validation pipelines, benchmarking libraries, interoperability standards, and public-facing platforms. However, these responses remain fragmented, and no shared consensus has yet emerged on what constitutes trustworthy SDG across contexts.</p>
        </sec>
        <sec>
          <title>Reflections and Recommendations</title>
          <p>The experiences discussed in this article suggest that SDG in health research has reached a point where technical feasibility is no longer the primary bottleneck. Instead, progress increasingly depends on how synthetic data are evaluated, governed, communicated, and trusted in practice.</p>
          <p>First, there is a need to reframe how success in SDG is defined and assessed. Much of the current emphasis remains on demonstrating technical performance, such as statistical similarity or model accuracy. While these measures are important, they do not on their own indicate whether synthetic data are appropriate for research or operational contexts. In practice, synthetic datasets may serve different purposes (eg, exploratory analysis, educational use, or hypothesis testing). These uses imply different expectations regarding the level of fidelity, reliability, and validation required. Clarifying the intended context of use can therefore help guide how synthetic datasets are evaluated and interpreted. This does not imply that all potential analytical applications must be evaluated in advance, but rather that evaluation strategies should be transparent about the contexts for which synthetic datasets are considered suitable. At the same time, general evaluation metrics remain essential to characterize the overall fidelity and privacy properties of synthetic datasets. In many cases, findings derived from exploratory analysis using synthetic data may subsequently require validation using the original data sources where appropriate access mechanisms exist.</p>
          <p>Second, greater attention should be given to data stewardship and governance upstream of SDG. Synthetic data reflects the characteristics and limitations of the infrastructures from which it is generated. Without robust practices for data quality management, interoperability, and documentation at source, SDG risks perpetuating existing shortcomings rather than addressing them. Aligning SDG initiatives with broader efforts to strengthen health data infrastructures would therefore increase both the reliability of synthetic outputs and institutional confidence in their reuse.</p>
          <p>Third, addressing the legal uncertainty surrounding synthetic health data is essential for wider adoption. In the absence of shared guidance, institutions often adopt cautious positions that limit reuse, particularly in sensitive or cross-border contexts. Developing common interpretations, best practices, or certification pathways that clarify when synthetic data can be considered sufficiently anonymized would provide a more stable foundation for decision-making. Such approaches would not eliminate the need for contextual oversight, but they would reduce fragmentation and support more consistent application of safeguards.</p>
          <p>Finally, trust building must be recognized as an active and ongoing process. Trust does not arise automatically from compliance with legal or ethical requirements nor from technical sophistication alone. It depends on transparency, interpretability, and the ability of stakeholders to understand how synthetic data were generated, evaluated, and intended to be used. Embedding mechanisms such as clear documentation, accessible validation summaries, and engagement with clinicians, data stewards, and other end users can support accountability and enable more nuanced judgments about risk and value.</p>
          <p>Overall, these reflections point to a broader shift in focus: from demonstrating that synthetic data can be generated to establishing the conditions under which it can be used responsibly, communicated transparently, and governed consistently. Advancing SDG along this path will require coordination across technical, institutional, and regulatory domains. If achieved, synthetic data can become not only a powerful analytical tool but also a credible and trusted component of health research ecosystems.</p>
        </sec>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Overview of all HealthData4EU projects, their objectives, data modalities, use cases, and methodological challenges.</p>
        <media xlink:href="jmir_v28i1e83369_app1.docx" xlink:title="DOCX File , 43 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AI</term>
          <def>
            <p>artificial intelligence</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">GDPR</term>
          <def>
            <p>General Data Protection Regulation</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">LOINC</term>
          <def>
            <p>Logical Observation Identifiers Names and Codes</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">SDG</term>
          <def>
            <p>synthetic data generation</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>The authors would like to thank all 7 HealthData4EU projects for their valuable input, collaboration, and contributions to this paper. Their openness and insights were essential to shaping the cross-case analysis. The authors are also grateful to Iraia Nuñez and Anna Lorenzini for their dedicated coordination and communications support. While not involved in the technical content of this study, their efforts in organizing exchanges and facilitating collaboration across the projects played a vital role in enabling this synthesis. No generative artificial intelligence tools were used in the generation of this paper.</p>
    </ack>
    <notes>
      <sec>
        <title>Funding</title>
        <p>This paper was funded by the Innovative Health Initiative through the SYNTHIA project. The study draws on insights from 7 research projects that form part of the HealthData4EU cluster. Projects within the cluster and their funding sources are as follows. SYNTHEMA, PHASE IV AI, SECURED, FLUTE, and AISym4MED are funded by the Horizon Europe program. PHEMS is funded by Horizon Europe and UK Research and Innovation. SYNTHIA is funded through the Innovative Health Initiative.</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="conflict">
        <p>SH is employed by VEIL.AI, a company developing data anonymization technologies. The work presented in this manuscript was conducted as part of the PHEMS consortium and was not influenced by the employer, and SH declares no direct financial or commercial interests related to this publication. The other authors have no conflicts of interest to declare.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Eden</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Burton-Jones</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Scott</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Staib</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sullivan</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Effects of eHealth on hospital practice: synthesis of the current literature</article-title>
          <source>Aust Health Rev</source>
          <year>2018</year>
          <month>09</month>
          <volume>42</volume>
          <issue>5</issue>
          <fpage>568</fpage>
          <lpage>578</lpage>
          <pub-id pub-id-type="doi">10.1071/AH17255</pub-id>
          <pub-id pub-id-type="medline">29986809</pub-id>
          <pub-id pub-id-type="pii">AH17255</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Abraham</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Novak</surname>
              <given-names>LL</given-names>
            </name>
            <name name-style="western">
              <surname>Reynolds</surname>
              <given-names>TL</given-names>
            </name>
            <name name-style="western">
              <surname>Gettinger</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>A survey of the literature on unintended consequences associated with health information technology: 2014–2015</article-title>
          <source>Yearb Med Inform</source>
          <year>2018</year>
          <month>03</month>
          <day>06</day>
          <volume>25</volume>
          <issue>01</issue>
          <fpage>13</fpage>
          <lpage>29</lpage>
          <pub-id pub-id-type="doi">10.15265/iy-2016-036</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Declerck</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sen</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Palmeri</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Oostenbrink</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Giannuzzi</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Woodworth</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Malik</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Mahler</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Aurich</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Leary</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Kalra</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Straub</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>The potential to leverage real-world data for pediatric clinical trials: a proof-of-concept study</article-title>
          <source>J Med Internet Res</source>
          <year>2025</year>
          <month>05</month>
          <day>30</day>
          <volume>27</volume>
          <fpage>e72573</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2025//e72573/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/72573</pub-id>
          <pub-id pub-id-type="medline">40446289</pub-id>
          <pub-id pub-id-type="pii">v27i1e72573</pub-id>
          <pub-id pub-id-type="pmcid">PMC12166320</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Penning</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Zozus</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Analysis of anesthesia screens for rule-based data quality assessment opportunities</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2019</year>
          <volume>257</volume>
          <fpage>473</fpage>
          <lpage>478</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/30741242"/>
          </comment>
          <pub-id pub-id-type="medline">30741242</pub-id>
          <pub-id pub-id-type="pmcid">PMC6692112</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wiebe</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Shaheen</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Eastwood</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Boussat</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Quan</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Indicators of missing electronic medical record (EMR) discharge summaries: a retrospective study on Canadian data</article-title>
          <source>Int J Popul Data Sci</source>
          <year>2020</year>
          <month>12</month>
          <day>11</day>
          <volume>5</volume>
          <issue>1</issue>
          <fpage>1352</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34007880"/>
          </comment>
          <pub-id pub-id-type="doi">10.23889/ijpds.v5i3.1352</pub-id>
          <pub-id pub-id-type="medline">34007880</pub-id>
          <pub-id pub-id-type="pii">S239949082001352X</pub-id>
          <pub-id pub-id-type="pmcid">PMC8104063</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Declerck</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kalra</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Vander Stichele</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Coorevits</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Frameworks, dimensions, definitions of aspects, and assessment methods for the appraisal of quality of health data for secondary use: comprehensive overview of reviews</article-title>
          <source>JMIR Med Inform</source>
          <year>2024</year>
          <month>03</month>
          <day>06</day>
          <volume>12</volume>
          <fpage>e51560</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2024//e51560/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/51560</pub-id>
          <pub-id pub-id-type="medline">38446534</pub-id>
          <pub-id pub-id-type="pii">v12i1e51560</pub-id>
          <pub-id pub-id-type="pmcid">PMC10955383</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shabani</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Marelli</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Re-identifiability of genomic data and the GDPR: assessing the re-identifiability of genomic data in light of the EU General Data Protection Regulation</article-title>
          <source>EMBO Rep</source>
          <year>2019</year>
          <month>06</month>
          <volume>20</volume>
          <issue>6</issue>
          <fpage>e48316</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.15252/embr.201948316"/>
          </comment>
          <pub-id pub-id-type="doi">10.15252/embr.201948316</pub-id>
          <pub-id pub-id-type="medline">31126909</pub-id>
          <pub-id pub-id-type="pii">embr.201948316</pub-id>
          <pub-id pub-id-type="pmcid">PMC6549023</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kahn</surname>
              <given-names>MG</given-names>
            </name>
            <name name-style="western">
              <surname>Callahan</surname>
              <given-names>TJ</given-names>
            </name>
            <name name-style="western">
              <surname>Barnard</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bauck</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Brown</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Davidson</surname>
              <given-names>BN</given-names>
            </name>
            <name name-style="western">
              <surname>Estiri</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Goerg</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Holve</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>SG</given-names>
            </name>
            <name name-style="western">
              <surname>Liaw</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hamilton-Lopez</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Meeker</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ong</surname>
              <given-names>TC</given-names>
            </name>
            <name name-style="western">
              <surname>Ryan</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Shang</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Weiskopf</surname>
              <given-names>NG</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zozus</surname>
              <given-names>MN</given-names>
            </name>
            <name name-style="western">
              <surname>Schilling</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>A harmonized data quality assessment terminology and framework for the secondary use of electronic health record data</article-title>
          <source>EGEMS (Wash DC)</source>
          <year>2016</year>
          <volume>4</volume>
          <issue>1</issue>
          <fpage>1244</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/27713905"/>
          </comment>
          <pub-id pub-id-type="doi">10.13063/2327-9214.1244</pub-id>
          <pub-id pub-id-type="medline">27713905</pub-id>
          <pub-id pub-id-type="pii">egems1244</pub-id>
          <pub-id pub-id-type="pmcid">PMC5051581</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Declerck</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Vandenberk</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Deschepper</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Colpaert</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Cool</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Goemaere</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bové</surname>
              <given-names>Mona</given-names>
            </name>
            <name name-style="western">
              <surname>Staelens</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>De Meester</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Verbeke</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Smits</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>De Decker</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Van Der Vekens</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Pauwels</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Vander Stichele</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Kalra</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Coorevits</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Building a foundation for high-quality health data: multihospital case study in Belgium</article-title>
          <source>JMIR Med Inform</source>
          <year>2024</year>
          <month>12</month>
          <day>20</day>
          <volume>12</volume>
          <fpage>e60244</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2024//e60244/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/60244</pub-id>
          <pub-id pub-id-type="medline">39727158</pub-id>
          <pub-id pub-id-type="pii">v12i1e60244</pub-id>
          <pub-id pub-id-type="pmcid">PMC11683741</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Leibson</surname>
              <given-names>CL</given-names>
            </name>
            <name name-style="western">
              <surname>Ransom</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Kho</surname>
              <given-names>AN</given-names>
            </name>
            <name name-style="western">
              <surname>Caraballo</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Chai</surname>
              <given-names>HS</given-names>
            </name>
            <name name-style="western">
              <surname>Yawn</surname>
              <given-names>BP</given-names>
            </name>
            <name name-style="western">
              <surname>Pacheco</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Chute</surname>
              <given-names>CG</given-names>
            </name>
          </person-group>
          <article-title>Impact of data fragmentation across healthcare centers on the accuracy of a high-throughput clinical phenotyping algorithm for specifying subjects with type 2 diabetes mellitus</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2012</year>
          <volume>19</volume>
          <issue>2</issue>
          <fpage>219</fpage>
          <lpage>24</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/22249968"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/amiajnl-2011-000597</pub-id>
          <pub-id pub-id-type="medline">22249968</pub-id>
          <pub-id pub-id-type="pii">amiajnl-2011-000597</pub-id>
          <pub-id pub-id-type="pmcid">PMC3277630</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Oja</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tamm</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Mooses</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Pajusalu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Talvik</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Ott</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Laht</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Malk</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lõo</surname>
              <given-names>Marcus</given-names>
            </name>
            <name name-style="western">
              <surname>Holm</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Haug</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Šuvalov</surname>
              <given-names>Hendrik</given-names>
            </name>
            <name name-style="western">
              <surname>Särg</surname>
              <given-names>Dage</given-names>
            </name>
            <name name-style="western">
              <surname>Vilo</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Laur</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kolde</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Reisberg</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Transforming Estonian health data to the Observational Medical Outcomes Partnership (OMOP) Common Data Model: lessons learned</article-title>
          <source>JAMIA Open</source>
          <year>2023</year>
          <month>12</month>
          <volume>6</volume>
          <issue>4</issue>
          <fpage>ooad100</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38058679"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamiaopen/ooad100</pub-id>
          <pub-id pub-id-type="medline">38058679</pub-id>
          <pub-id pub-id-type="pii">ooad100</pub-id>
          <pub-id pub-id-type="pmcid">PMC10697784</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gonzales</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Guruswamy</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>SR</given-names>
            </name>
          </person-group>
          <article-title>Synthetic data in health care: a narrative review</article-title>
          <source>PLOS Digit Health</source>
          <year>2023</year>
          <month>01</month>
          <volume>2</volume>
          <issue>1</issue>
          <fpage>e0000082</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://air.unimi.it/handle/2434/235313"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pdig.0000082</pub-id>
          <pub-id pub-id-type="medline">36812604</pub-id>
          <pub-id pub-id-type="pii">PDIG-D-22-00188</pub-id>
          <pub-id pub-id-type="pmcid">PMC9931305</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Giuffrè</surname>
              <given-names>Mauro</given-names>
            </name>
            <name name-style="western">
              <surname>Shung</surname>
              <given-names>DL</given-names>
            </name>
          </person-group>
          <article-title>Harnessing the power of synthetic data in healthcare: innovation, application, and privacy</article-title>
          <source>NPJ Digit Med</source>
          <year>2023</year>
          <month>10</month>
          <day>09</day>
          <volume>6</volume>
          <issue>1</issue>
          <fpage>186</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41746-023-00927-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41746-023-00927-3</pub-id>
          <pub-id pub-id-type="medline">37813960</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41746-023-00927-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC10562365</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Al-Dhamari</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Abu Attieh</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Prasser</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Synthetic datasets for open software development in rare disease research</article-title>
          <source>Orphanet J Rare Dis</source>
          <year>2024</year>
          <month>07</month>
          <day>15</day>
          <volume>19</volume>
          <issue>1</issue>
          <fpage>265</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ojrd.biomedcentral.com/articles/10.1186/s13023-024-03254-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s13023-024-03254-2</pub-id>
          <pub-id pub-id-type="medline">39010138</pub-id>
          <pub-id pub-id-type="pii">10.1186/s13023-024-03254-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC11247768</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Goncalves</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ray</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Soper</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Stevens</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Coyle</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Sales</surname>
              <given-names>AP</given-names>
            </name>
          </person-group>
          <article-title>Generation and evaluation of synthetic patient data</article-title>
          <source>BMC Med Res Methodol</source>
          <year>2020</year>
          <month>05</month>
          <day>07</day>
          <volume>20</volume>
          <issue>1</issue>
          <fpage>108</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedresmethodol.biomedcentral.com/articles/10.1186/s12874-020-00977-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12874-020-00977-1</pub-id>
          <pub-id pub-id-type="medline">32381039</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12874-020-00977-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC7204018</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Park</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Mohammadi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gorde</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Jajodia</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Data synthesis based on generative adversarial networks</article-title>
          <source>Proc VLDB Endow</source>
          <year>2018</year>
          <month>06</month>
          <volume>11</volume>
          <issue>10</issue>
          <fpage>1071</fpage>
          <lpage>1083</lpage>
          <pub-id pub-id-type="doi">10.14778/3231751.3231757</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Esteban</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hyland</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Rätsch</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Real-valued (medical) time series generation with recurrent conditional gans</article-title>
          <source>ArXiv</source>
          <comment>Preprint posted online on December 4, 2017</comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.1706.02633</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hashemi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Soliman</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lundström</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Etminani</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Domain knowledge-driven generation of synthetic healthcare data</article-title>
          <source>Volume 302: Caring is Sharing – Exploiting the Value in Data for Health and Innovation</source>
          <year>2023</year>
          <month>05</month>
          <day>22</day>
          <publisher-loc>Amsterdam, Netherlands</publisher-loc>
          <publisher-name>IOS Press eBooks</publisher-name>
          <fpage>352</fpage>
          <lpage>353</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ogwel</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Mzazi</surname>
              <given-names>VH</given-names>
            </name>
            <name name-style="western">
              <surname>Awuor</surname>
              <given-names>AO</given-names>
            </name>
            <name name-style="western">
              <surname>Otieno</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Ogolla</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Nyawanda</surname>
              <given-names>BO</given-names>
            </name>
            <name name-style="western">
              <surname>Omore</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>A quarter-century of synthetic data in healthcare: Unveiling trends with structural topic modeling</article-title>
          <source>Digit Health</source>
          <year>2025</year>
          <volume>11</volume>
          <fpage>20552076251404530</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://air.unimi.it/handle/2434/235313"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/20552076251404530</pub-id>
          <pub-id pub-id-type="medline">41346942</pub-id>
          <pub-id pub-id-type="pii">10.1177_20552076251404530</pub-id>
          <pub-id pub-id-type="pmcid">PMC12673032</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Alaa</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Van</surname>
              <given-names>BB</given-names>
            </name>
            <name name-style="western">
              <surname>Saveliev</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Van</surname>
              <given-names>DSM</given-names>
            </name>
          </person-group>
          <article-title>editors</article-title>
          <source>arXiv</source>
          <year>2022</year>
          <month>07</month>
          <day>13</day>
          <fpage>1</fpage>
          <lpage>17</lpage>
          <pub-id pub-id-type="doi">10.48550/arXiv.2102.08921</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stenger</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Leppich</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Foster</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Kounev</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bauer</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Evaluation is key: a survey on evaluation measures for synthetic time series</article-title>
          <source>J Big Data</source>
          <year>2024</year>
          <month>05</month>
          <day>07</day>
          <volume>11</volume>
          <issue>1</issue>
          <fpage>66</fpage>
          <pub-id pub-id-type="doi">10.1186/s40537-024-00924-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Topol</surname>
              <given-names>EJ</given-names>
            </name>
          </person-group>
          <article-title>High-performance medicine: the convergence of human and artificial intelligence</article-title>
          <source>Nat Med</source>
          <year>2019</year>
          <month>01</month>
          <volume>25</volume>
          <issue>1</issue>
          <fpage>44</fpage>
          <lpage>56</lpage>
          <pub-id pub-id-type="doi">10.1038/s41591-018-0300-7</pub-id>
          <pub-id pub-id-type="medline">30617339</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41591-018-0300-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jordon</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Szpruch</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Houssiau</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Bottarelli</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cherubin</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Maple</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Synthetic data -- what, why and how?</article-title>
          <source>ArXiv</source>
          <comment>Preprint posted online on May 6, 2022</comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.2205.03257</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kaabachi</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Despraz</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Meurers</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Otte</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Halilovic</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kulynych</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Prasser</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Raisaro</surname>
              <given-names>JL</given-names>
            </name>
          </person-group>
          <article-title>A scoping review of privacy and utility metrics in medical synthetic data</article-title>
          <source>NPJ Digit Med</source>
          <year>2025</year>
          <month>01</month>
          <day>27</day>
          <volume>8</volume>
          <issue>1</issue>
          <fpage>60</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41746-024-01359-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41746-024-01359-3</pub-id>
          <pub-id pub-id-type="medline">39870798</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41746-024-01359-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC11772694</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liaw</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>JGN</given-names>
            </name>
            <name name-style="western">
              <surname>Ansari</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Jonnagaddala</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Godinho</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Borelli</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>de Lusignan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Capurro</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Liyanage</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Bhattal</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Bennett</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Chan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kahn</surname>
              <given-names>MG</given-names>
            </name>
          </person-group>
          <article-title>Quality assessment of real-world data repositories across the data life cycle: a literature review</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2021</year>
          <month>07</month>
          <day>14</day>
          <volume>28</volume>
          <issue>7</issue>
          <fpage>1591</fpage>
          <lpage>1599</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://air.unimi.it/handle/2434/235313"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocaa340</pub-id>
          <pub-id pub-id-type="medline">33496785</pub-id>
          <pub-id pub-id-type="pii">6120399</pub-id>
          <pub-id pub-id-type="pmcid">PMC8475229</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pilgram</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ko</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Tung</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>El Emam</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Protecting patient privacy in tabular synthetic health data: a regulatory perspective</article-title>
          <source>NPJ Digit Med</source>
          <year>2025</year>
          <month>11</month>
          <day>28</day>
          <volume>8</volume>
          <issue>1</issue>
          <fpage>732</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41746-025-02112-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41746-025-02112-0</pub-id>
          <pub-id pub-id-type="medline">41315669</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41746-025-02112-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC12663144</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
