<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v27i1e63130</article-id>
      <article-id pub-id-type="pmid">40245392</article-id>
      <article-id pub-id-type="doi">10.2196/63130</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Short Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Short Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Generating Artificial Patients With Reliable Clinical Characteristics Using a Geometry-Based Variational Autoencoder: Proof-of-Concept Feasibility Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Coristine</surname>
            <given-names>Andrew</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Chen</surname>
            <given-names>DeJiu</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Astha</surname>
            <given-names>Varuna</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Ferré</surname>
            <given-names>Fabrice</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Department of Anesthesia, Intensive Care and Perioperative Medicine</institution>
            <institution>Purpan University Hospital</institution>
            <addr-line>Place du Dr Baylac</addr-line>
            <addr-line>Toulouse, 31300</addr-line>
            <country>France</country>
            <phone>33 561779988</phone>
            <email>fabriceferre31@gmail.com</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6648-7454</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Allassonnière</surname>
            <given-names>Stéphanie</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5692-4945</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Chadebec</surname>
            <given-names>Clément</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-3890-1392</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Minville</surname>
            <given-names>Vincent</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0516-4939</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Department of Anesthesia, Intensive Care and Perioperative Medicine</institution>
        <institution>Purpan University Hospital</institution>
        <addr-line>Toulouse</addr-line>
        <country>France</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Université Paris Cité, Unité Mixte de Recherche S1138, Institut national de recherche en sciences et technologies du numérique, Sorbonne University</institution>
        <addr-line>Paris</addr-line>
        <country>France</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Fabrice Ferré <email>fabriceferre31@gmail.com</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2025</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>17</day>
        <month>4</month>
        <year>2025</year>
      </pub-date>
      <volume>27</volume>
      <elocation-id>e63130</elocation-id>
      <history>
        <date date-type="received">
          <day>11</day>
          <month>6</month>
          <year>2024</year>
        </date>
        <date date-type="rev-request">
          <day>8</day>
          <month>7</month>
          <year>2024</year>
        </date>
        <date date-type="rev-recd">
          <day>1</day>
          <month>11</month>
          <year>2024</year>
        </date>
        <date date-type="accepted">
          <day>17</day>
          <month>12</month>
          <year>2024</year>
        </date>
      </history>
      <copyright-statement>©Fabrice Ferré, Stéphanie Allassonnière, Clément Chadebec, Vincent Minville. Originally published in the Journal of Medical Internet Research (https://www.jmir.org), 17.04.2025.</copyright-statement>
      <copyright-year>2025</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research (ISSN 1438-8871), is properly cited. The complete bibliographic information, a link to the original publication on https://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2025/1/e63130" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Artificial patient technology could transform health care by accelerating diagnosis, treatment, and mapping clinical pathways. Deep learning methods for generating artificial data in health care include data augmentation by variational autoencoders (VAE) technology.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>We aimed to test the feasibility of generating artificial patients with reliable clinical characteristics by using a geometry-based VAE applied, for the first time, on high-dimension, low-sample-size tabular data.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>Clinical tabular data were extracted from 521 real patients of the “MAX” digital conversational agent (BOTdesign) created for preparing patients for anesthesia. A 3-stage methodological approach was implemented to generate up to 10,000 artificial patients: training the model and generating artificial data, assessing the consistency and confidentiality of artificial data, and validating the plausibility of the newly created artificial patients.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>We demonstrated the feasibility of applying the VAE technique to tabular data to generate large artificial patient cohorts with high consistency (fidelity scores&#62;94%). Moreover, artificial patients could not be matched with real patients (filter similarity scores&#62;99%, κ coefficients of agreement&#60;0.2), thus guaranteeing the essential ethical concern of confidentiality.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>This proof-of-concept study has demonstrated our ability to augment real tabular data to generate artificial patients. These promising results make it possible to envisage in silico trials carried out on large cohorts of artificial patients, thereby overcoming the pitfalls usually encountered in in vivo trials. Further studies integrating longitudinal dynamics are needed to map patient trajectories.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>digital health</kwd>
        <kwd>artificial data</kwd>
        <kwd>variational autoencoder</kwd>
        <kwd>data science</kwd>
        <kwd>artificial intelligence</kwd>
        <kwd>health monitoring</kwd>
        <kwd>deep learning</kwd>
        <kwd>medical imaging</kwd>
        <kwd>imaging</kwd>
        <kwd>magnetic resonance imaging</kwd>
        <kwd>Alzheimer disease</kwd>
        <kwd>anesthesia</kwd>
        <kwd>prediction</kwd>
        <kwd>data augmentation</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>With the growing impact of data science technologies, novel health care ecosystems centered around artificial patients are developing. The data science–based approach for generating artificial patients involves augmenting real data [<xref ref-type="bibr" rid="ref1">1</xref>]. Thus, new artificial data are created with characteristics similar to those of the original population of interest. Such data could be particularly valuable in clinical research, offering the potential for studies that are not only more cost-effective but, more importantly, also more inclusive and impactful—especially in cases where patient recruitment poses a challenge [<xref ref-type="bibr" rid="ref2">2</xref>].</p>
      <p>From a methodological point of view, artificial labeled data are generated using mechanistic or statistical methods. The mechanistic approach combines known equations from physical, biological, or other fields to describe a phenomenon, referred to as digital twins. This approach could facilitate personalized therapeutics [<xref ref-type="bibr" rid="ref3">3</xref>], though its routine use in medical processes remains limited [<xref ref-type="bibr" rid="ref4">4</xref>]. Deep learning methods for generating artificial data in health care include technologies based on generative adversarial networks (GANs) [<xref ref-type="bibr" rid="ref5">5</xref>] or variational autoencoders (VAEs) [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref6">6</xref>]. However, most of the studies using GANs focused on a fairly large training set (over 1000 training samples) or on low-dimension data, while it remains very challenging to gather such large cohorts of labeled patients. Therefore, the case of high-dimensional data combined with a small sample size (a situation commonly encountered in medicine) remains largely unexplored by GAN technologies. Chadebec et al [<xref ref-type="bibr" rid="ref1">1</xref>] have recently demonstrated, by using a VAE, that the artificial augmentation of medical imaging data significantly improved classification accuracy. The balanced accuracy increases from 66% to 74% for a convolutional neural network classifier trained with small datasets (50 magnetic resonance images each of cognitively healthy individuals and patients with Alzheimer disease), while improving greatly the sensitivity and specificity of the classification metrics [<xref ref-type="bibr" rid="ref1">1</xref>]. In other words, a geometry-based VAE was able to produce meaningful samples from high-dimension, low-sample-size (HDLSS) imaging datasets. This method, validated for an image classification task (voxels), deserves to be tested on (clinical) tabular data. Given the multiplicity and complexity of the data obtained in anesthesia, this statistical approach using artificially augmented data could be of major interest to identify predictive clinical factors of poor outcomes with accuracy and reliability. Thus, the aim of our study was to test the feasibility of generating artificial patients with reliable clinical characteristics by using a VAE applied on HDLSS tabular data.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Overview</title>
        <p>Clinical tabular data were extracted from 521 real patients of the MAX (BOTdesign) database. MAX is a digital conversational agent for preparing patients for anesthesia [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref8">8</xref>]. Collected data included demographic characteristics, past medical history, medication, and other relevant medical items.</p>
        <p>Details of the methodological approach used to train the model and generate artificial data are available in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. Briefly, the dataset included 521 patients about to undergo anesthesia, each with 85 clinical features. Once data preprocessing was completed (<xref rid="figure1" ref-type="fig">Figure 1</xref>), the model was trained on a (521, 103) dimension dataset using a modified Pyraug’s training pipeline (<xref rid="figure2" ref-type="fig">Figure 2</xref>). Training hyperparameters were set to 1000 epochs, a batch size of 32, and a learning rate of 0.001. Two datasets of 5000 and 10,000 artificial patients were generated, representing a data increase rate of 10 and 20 artificial patients, respectively, for 1 real patient.</p>
        <p>The next step involved assessing the consistency (fidelity scores) and confidentiality (filter similarity scores and degree of anonymization) of artificial data.</p>
        <p>Finally, the plausibility of newly generated artificial patients was validated through expert human supervision (categorization task).</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Illustration of the data preprocessing step. MET: metabolic equivalent task.</p>
          </caption>
          <graphic xlink:href="jmir_v27i1e63130_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Illustration of the complete pipeline for generating artificial patients. For more details, see <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. TDProcessor: TabularDataProcessor.</p>
          </caption>
          <graphic xlink:href="jmir_v27i1e63130_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>We did not seek ethics approval in accordance with the Commision Nationale Informatique et Libertés policy on secondary analyses of preexisting datasets (Titles I and II) [<xref ref-type="bibr" rid="ref9">9</xref>], as patients were informed that their data may be securely stored, coded for confidentiality, and used for research unless they explicitly object.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Consistency and Confidentiality of Artificial Data</title>
        <p>To assess the consistency of newly generated artificial data, fidelity scores were calculated. A fidelity score is defined as the arithmetic mean of its 3 components: numerical and categorical data distribution stability and numerical data correlation stability. Results are presented in <xref ref-type="table" rid="table1">Table 1</xref> and illustrated in <xref rid="figure3" ref-type="fig">Figures 3</xref> and <xref rid="figure4" ref-type="fig">4</xref>. Equations used to calculate stability scores for numerical and categorical data are available in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Fidelity scores and their components for the 5000 and 10,000 artificial patients generated.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="310"/>
            <col width="350"/>
            <col width="310"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Scores</td>
                <td>5000 artificial patients, %</td>
                <td>10,000 artificial patients, %</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="2">
                  <bold>Fidelity score</bold>
                </td>
                <td>97.8</td>
                <td>94.6</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Numerical stability</td>
                <td>100</td>
                <td>100</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Categorical stability</td>
                <td>96.4</td>
                <td>91.2</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Numerical correlation stability</td>
                <td>97.1</td>
                <td>92.6</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Distribution of (A) the numerical variable “age” and (B) the categorical variable “gender” (in relative percentage) from the datasets of 521 real and 5000 artificial patients.</p>
          </caption>
          <graphic xlink:href="jmir_v27i1e63130_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Matrices illustrating the correlation of numerical variables from the datasets of 521 real and 5000 artificial patients (A) and (B) and their differences (C).</p>
          </caption>
          <graphic xlink:href="jmir_v27i1e63130_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>With fidelity scores of 97.8% and 94.6%, data of the 5000 and 10,000 artificial patients were considered realistic and representative of the real data.</p>
        <p>To assess the confidentiality of newly generated artificial data, filter similarity scores (proportion of data not similar to the initial dataset) and degree of anonymization (Euclidean distance) were calculated. The results strongly confirm the nonsimilarity of the artificial data with the initial real data (filter similarity scores&#62;99.9%) and a high degree of anonymization (the artificial data were further away from the initial dataset than the initial data were from each other).</p>
      </sec>
      <sec>
        <title>Plausibility of Artificial Patients</title>
        <p>A categorization task was performed by 3 experienced anesthetists who were blinded, with the distribution of a balanced sample of 100 real and artificial patients generated using the VAE. Anesthetists were asked to determine whether each patient was real or artificial. The κ coefficients of agreement were –0.12 (95% CI –0.31 to 0.07), 0.15 (95% CI 0.1-0.26), and 0.09 (95% CI –0.14 to 0.15). Given the very low agreement coefficients (&#60;0.2), none of the 3 experts could differentiate between real and artificial patients, arguing for the medical plausibility of the artificial patients.</p>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <p>Through this proof-of-concept study, we demonstrated, for the first time, the feasibility to transpose the VAE technique from imaging to HDLSS clinical data for the generation of a large number of artificial patients. The high fidelity scores obtained demonstrate the consistency of our artificial cohorts. Moreover, as suggested by the high filter similarity scores and the low agreement coefficients of the categorization task, the artificial patients could not be matched with real patients.</p>
      <p>The use of artificial intelligence (AI) in health care presents particularly complex challenges inherent in the types of data it relies on (sensitive, sparse, heterogeneous, limited, etc). However, research efforts over the last few years, which have focused on meeting these specific challenges, now offer a glimpse of dizzying potential, particularly in the field of clinical research. In silico trials on artificial patient cohorts can quickly and cost-effectively include diverse minority groups (eg, rare diseases, children, pregnant women, and ethnic minorities), reducing risks and recruitment challenges of traditional in vivo trials. In this setting, artificial patients’ technology has the potential to transform health care by improving diagnosis, treatment, and mapping clinical pathways [<xref ref-type="bibr" rid="ref3">3</xref>].</p>
      <p>Validation of mathematical models and algorithms is important from an ethical point of view. Like any data processing, the implementation of artificial patient cohorts requires human oversight (in reference to the AI Act [<xref ref-type="bibr" rid="ref10">10</xref>]). This principle of “Human Guarantee” refers to the need not to relinquish decision-making autonomy in the context of increasingly rapid dissemination of AI. Organized in the form of human oversight committees, these control measures will help better understand the phase of modeling artificial patient populations and ensure that it is as unbiased and reliable as possible. The need to protect health data and the rights of the individuals is a matter of debate that will likely be resolved with the expected advances in anonymization. Ensuring that artificial and real data are not similar is one way of guaranteeing anonymization and confidentiality. In this setting, no real patient should be identifiable from artificial data.</p>
      <p>Our results must be interpreted with caution and a number of limitations should be borne in mind. First, our study presents promising results but does not present a comparative analysis with existing methods for generating artificial patient data (eg, GANs). In this setting, further studies designed to identify the most effective approach could be of major interest. Second, our study strongly lacks a comparative analysis with the late postoperative outcomes of real patients. Further studies integrating longitudinal dynamics are needed to map trends and identify patient trajectories. In this context, the recent update of MAX with the implementation of a postoperative digital conversational agent for the collection of recovery data based on patient-reported outcome measures could be of major interest. Indeed, we plan to compare longitudinal data from real patients with those obtained in a cohort of artificial patients. Finally, the results of our proof-of-concept study are encouraging, but it seems necessary to replicate the method. For instance, a process is underway to validate the reliability of artificial patient cohorts by replaying old clinical trials using data shared on the Yale University Open Data Access. Moreover, we plan to apply our VAE method to other kinds of data (eg, multimodal data). In this setting, the first European web platform for augmenting data and creating artificial patient cohorts with VAE’s generative AI has recently been created (ORIGA; BOTdesign).</p>
      <p>To conclude, we demonstrate, for the first time, the feasibility to augment HDLSS clinical tabular data by using a VAE. The newly generated artificial patient cohorts were consistent with real source data. We believe that in silico trials can be used to track a variety of health indicators and generate key insights. Artificial patients will revolutionize health care paving the way for a more precise, personalized, and predictive medicine.</p>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Additional material.</p>
        <media xlink:href="jmir_v27i1e63130_app1.docx" xlink:title="DOCX File , 176 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AI</term>
          <def>
            <p>artificial intelligence</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">GAN</term>
          <def>
            <p>generative adversarial network</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">HDLSS</term>
          <def>
            <p>high-dimension, low-sample-size</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">VAE</term>
          <def>
            <p>variational autoencoder</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>We would like to thank Open Studio (IA-Lab, Lyon, France) for their data analyses. We would also like to thank Olivier Thuillart and Jean-Louis Fraysse from BOTdesign (Toulouse, France), the company that created the digital companion MAX. The research leading to these results has received funding from the French government under management of Agence Nationale de la Recherche as part of the “Investissements d’avenir” program (reference ANR-19-P3IA-0001, PRAIRIE 3IA Institute; and reference ANR-10-IAIHU-06, Agence Nationale de la Recherche-10-IA Institut Hospitalo-Universitaire-6).</p>
    </ack>
    <notes>
      <sec>
        <title>Data Availability</title>
        <p>Data are available from the corresponding author upon request.</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="con">
        <p>Conceptualization: FF, SA, and VM</p>
        <p>Formal analysis: SA and CC</p>
        <p>Investigation: FF and VM</p>
        <p>Methodology: FF and SA</p>
        <p>Writing—original draft: FF, SA, CC, and VM</p>
        <p>Writing—review and editing: FF</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chadebec</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Thibeau-Sutre</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Burgos</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Allassonniere</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Data augmentation in high dimensional low sample size setting using a geometry-based variational autoencoder</article-title>
          <source>IEEE Trans Pattern Anal Mach Intell</source>
          <year>2023</year>
          <month>03</month>
          <volume>45</volume>
          <issue>3</issue>
          <fpage>2879</fpage>
          <lpage>2896</lpage>
          <pub-id pub-id-type="doi">10.1109/TPAMI.2022.3185773</pub-id>
          <pub-id pub-id-type="medline">35749321</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Desai</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Recruitment and retention of participants in clinical studies: critical issues and challenges</article-title>
          <source>Perspect Clin Res</source>
          <year>2020</year>
          <volume>11</volume>
          <issue>2</issue>
          <fpage>51</fpage>
          <pub-id pub-id-type="doi">10.4103/picr.picr_6_20</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Elkefi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Asan</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <article-title>Digital twins for managing health care systems: rapid literature review</article-title>
          <source>J Med Internet Res</source>
          <year>2022</year>
          <month>08</month>
          <day>16</day>
          <volume>24</volume>
          <issue>8</issue>
          <fpage>e37641</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2022/8/e37641/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/37641</pub-id>
          <pub-id pub-id-type="medline">35972776</pub-id>
          <pub-id pub-id-type="pii">v24i8e37641</pub-id>
          <pub-id pub-id-type="pmcid">PMC9428772</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fischer</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Volpert</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Antonino</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Ahrens</surname>
              <given-names>TD</given-names>
            </name>
          </person-group>
          <article-title>Digital patient twins for personalized therapeutics and pharmaceutical manufacturing</article-title>
          <source>Front Digit Health</source>
          <year>2023</year>
          <volume>5</volume>
          <fpage>1302338</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38250053"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fdgth.2023.1302338</pub-id>
          <pub-id pub-id-type="medline">38250053</pub-id>
          <pub-id pub-id-type="pmcid">PMC10796488</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Segal</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Rubin</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Rubin</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Pantanowitz</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Evaluating the clinical realism of synthetic chest x-rays generated using progressively growing GANs</article-title>
          <source>SN Comput Sci</source>
          <year>2021</year>
          <volume>2</volume>
          <issue>4</issue>
          <fpage>321</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34104898"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s42979-021-00720-7</pub-id>
          <pub-id pub-id-type="medline">34104898</pub-id>
          <pub-id pub-id-type="pii">720</pub-id>
          <pub-id pub-id-type="pmcid">PMC8176276</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Allassonière</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Fraysse</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <source>Artificial data in healthcare: analysis and areas for consideration [Article in French]</source>
          <year>2024</year>
          <access-date>2025-03-19</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://static.botdesign.net/docs/VF_Livre_blanc_Données_de_santé_artificielles-250424.pdf">https://static.botdesign.net/docs/VF_Livre_blanc_Données_de_santé_artificielles-250424.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ferré</surname>
              <given-names>Fabrice</given-names>
            </name>
            <name name-style="western">
              <surname>Boeschlin</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Bastiani</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Castel</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ferrier</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bosch</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Muscari</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Kurrek</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Fourcade</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Piau</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Minville</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Improving provision of preanesthetic information through use of the digital conversational agent "MyAnesth": prospective observational trial</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <month>12</month>
          <day>04</day>
          <volume>22</volume>
          <issue>12</issue>
          <fpage>e20455</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/12/e20455/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/20455</pub-id>
          <pub-id pub-id-type="medline">33275108</pub-id>
          <pub-id pub-id-type="pii">v22i12e20455</pub-id>
          <pub-id pub-id-type="pmcid">PMC7748965</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ferré</surname>
              <given-names>Fabrice</given-names>
            </name>
            <name name-style="western">
              <surname>Laurent</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Furelau</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Doumard</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Ferrier</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bosch</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ba</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Menut</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Kurrek</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Geeraerts</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Piau</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Minville</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Perioperative risk assessment of patients using the MyRISK digital score completed before the preanesthetic consultation: prospective observational study</article-title>
          <source>JMIR Perioper Med</source>
          <year>2023</year>
          <month>01</month>
          <day>16</day>
          <volume>6</volume>
          <fpage>e39044</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://periop.jmir.org/2023//e39044/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/39044</pub-id>
          <pub-id pub-id-type="medline">36645704</pub-id>
          <pub-id pub-id-type="pii">v6i1e39044</pub-id>
          <pub-id pub-id-type="pmcid">PMC9887512</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="web">
          <article-title>Deliberation No. 2018-155 of May 3, 2018 approving the reference methodology relating to the processing of personal data implemented in the context of research not involving human beings, studies and evaluations in the field of health (MR-004)</article-title>
          <source>Commision Nationale Informatique et Libertés</source>
          <access-date>2025-04-11</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://tinyurl.com/3c598h7y">https://tinyurl.com/3c598h7y</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="web">
          <article-title>Article 14: Human Oversight</article-title>
          <source>EU Artificial Intelligence Act</source>
          <access-date>2024-06-13</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://artificialintelligenceact.eu/article/14/">https://artificialintelligenceact.eu/article/14/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
