<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v25i1e43484</article-id>
      <article-id pub-id-type="pmid">37018021</article-id>
      <article-id pub-id-type="doi">10.2196/43484</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Viewpoint</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Viewpoint</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Data Challenges for Externally Controlled Trials: Viewpoint</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Mavragani</surname>
            <given-names>Amaryllis</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Kumwichar</surname>
            <given-names>Ponlagrit</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Dreyer</surname>
            <given-names>Nancy</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Velummailum</surname>
            <given-names>Russanthy Ruthiran</given-names>
          </name>
          <degrees>MSc, MPH</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5958-1223</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>McKibbon</surname>
            <given-names>Chelsea</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0783-5759</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Brenner</surname>
            <given-names>Darren R</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-8577-7278</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Stringer</surname>
            <given-names>Elizabeth Ann</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7131-8874</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Ekstrom</surname>
            <given-names>Leeland</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0768-4228</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Dron</surname>
            <given-names>Louis</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Cytel, Inc</institution>
            <addr-line>777 West Broadway</addr-line>
            <addr-line>Suite 802</addr-line>
            <addr-line>Vancouver, BC, V5Z1J5</addr-line>
            <country>Canada</country>
            <phone>1 604 294 3823</phone>
            <email>louis.dron@cytel.com</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-3276-3948</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Cytel, Inc</institution>
        <addr-line>Vancouver, BC</addr-line>
        <country>Canada</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Oncology</institution>
        <institution>University of Calgary</institution>
        <addr-line>Calgary, AB</addr-line>
        <country>Canada</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Nashville Biosciences</institution>
        <addr-line>Nashville, TN</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Louis Dron <email>louis.dron@cytel.com</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2023</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>5</day>
        <month>4</month>
        <year>2023</year>
      </pub-date>
      <volume>25</volume>
      <elocation-id>e43484</elocation-id>
      <history>
        <date date-type="received">
          <day>12</day>
          <month>10</month>
          <year>2022</year>
        </date>
        <date date-type="rev-request">
          <day>11</day>
          <month>1</month>
          <year>2023</year>
        </date>
        <date date-type="rev-recd">
          <day>1</day>
          <month>2</month>
          <year>2023</year>
        </date>
        <date date-type="accepted">
          <day>19</day>
          <month>2</month>
          <year>2023</year>
        </date>
      </history>
      <copyright-statement>©Russanthy Ruthiran Velummailum, Chelsea McKibbon, Darren R Brenner, Elizabeth Ann Stringer, Leeland Ekstrom, Louis Dron. Originally published in the Journal of Medical Internet Research (https://www.jmir.org), 05.04.2023.</copyright-statement>
      <copyright-year>2023</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on https://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2023/1/e43484" xlink:type="simple"/>
      <abstract>
        <p>The preferred evidence of a large randomized controlled trial is difficult to adopt in scenarios, such as rare conditions or clinical subgroups with high unmet needs, and evidence from external sources, including real-world data, is being increasingly considered by decision makers. Real-world data originate from many sources, and identifying suitable real-world data that can be used to contextualize a single-arm trial, as an external control arm, has several challenges. In this viewpoint article, we provide an overview of the technical challenges raised by regulatory and health reimbursement agencies when evaluating comparative efficacy, such as identification, outcome, and time selection challenges. By breaking down these challenges, we provide practical solutions for researchers to consider through the approaches of detailed planning, collection, and record linkage to analyze external data for comparative efficacy.</p>
      </abstract>
      <kwd-group>
        <kwd>external control arm</kwd>
        <kwd>synthetic control arm</kwd>
        <kwd>single-arm trial</kwd>
        <kwd>real-world evidence</kwd>
        <kwd>regulatory approval</kwd>
        <kwd>data</kwd>
        <kwd>clinical</kwd>
        <kwd>decision-making</kwd>
        <kwd>efficacy</kwd>
        <kwd>rare conditions</kwd>
        <kwd>trial</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Historically, real-world evidence from observational studies has had limited use for demonstrating therapeutic effectiveness for regulatory and reimbursement purposes. However, several recent developments, including the 21st Century Cure Act, increased accessibility to large-scale routinely collected health data, improved standardization of collection, and increased high-profile regulatory applications, and have resulted in an increased demand for these data and increased availability of these data [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. This has changed the data landscape, with growing recognition of the value of using real-world evidence that is applicable for regulatory and reimbursement purposes. Frameworks from regulatory bodies, such as the United States Food and Drug Administration (FDA) and European Medicines Agency (EMA), and reimbursement agencies, such as the National Institute for Health and Care Excellence (NICE), specifically call out the use of external data sources in conjunction with single-arm evidence, particularly in rare diseases or clinical subgroups where there is a high unmet medical need and traditional randomized controlled trials (RCTs) may not be feasible [<xref ref-type="bibr" rid="ref3">3</xref>-<xref ref-type="bibr" rid="ref7">7</xref>].</p>
      <p>Real-world evidence is derived from rigorous analyses of real-world data. Real-world data are data related to patient health status or delivery of health care outside of RCTs where sources commonly originate from electronic health records (EHRs), medical claims data, and product and disease registries [<xref ref-type="bibr" rid="ref8">8</xref>]. In addition to what may be considered common forms, real-world data from outside of traditional medical charting, including data from mobile phones, wearables, and patient-reported outcomes, have provided an abundance of data, allowing comprehensive capture of the natural course of a disease from both the physician and patient perspectives [<xref ref-type="bibr" rid="ref9">9</xref>-<xref ref-type="bibr" rid="ref11">11</xref>]. Although outside of the scope of this viewpoint, data from historical clinical trials have been found to be influential in comparative efficacy analyses and have been found to have a role in supplementing an external control study through hybrid study designs [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>].</p>
      <p>Given the adoption and use of EHRs and other data content sources in general practice, real-world data and real-world evidence are being increasingly reported in publications in recent years (<xref rid="figure1" ref-type="fig">Figure 1</xref>) and are being increasingly used in health care decisions [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref15">15</xref>].</p>
      <fig id="figure1" position="float">
        <label>Figure 1</label>
        <caption>
          <p>Number of real-world data and real-world evidence publications over time from 1965 to 2021. The following search terms have been considered in PubMed: “real-world” or “observational” or “nonrandomized” or “standard of care” or “external control” or “single-arm” or “historical-control” or “retrospective” or “noninterventional” or “case series” or “natural history” or “electronic health record” or “electronic medical record” or “claims”.</p>
        </caption>
        <graphic xlink:href="jmir_v25i1e43484_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <p>As the majority of criticism from regulatory and reimbursement agencies on applications using real-world data has so far focused predominantly on data features (type, quality, and frequency) and confounding and selection bias limitations, appropriate curation and evaluation of these sources are critical components of any exercise using external evidence [<xref ref-type="bibr" rid="ref16">16</xref>]. In this paper, we provide an overview of the challenges in identifying data suitable for external control arms, including common pseudonyms, such as synthetic control arms and historical controls, when evaluating comparative efficacy, and provide solutions for researchers to consider.</p>
    </sec>
    <sec>
      <title>Technical Challenges</title>
      <sec>
        <title>Challenges in Data Source Identification for Rare Conditions</title>
        <p>RCTs have long been considered the gold standard approach to evaluate the comparative effectiveness of a drug or biological product due to the standardized methods to reduce bias, including randomization and blinding, as well as balancing known and unknown confounders. These gold standard trials, however, may not reflect the real-world setting where the patient is treated [<xref ref-type="bibr" rid="ref17">17</xref>]. This is particularly notable for rare diseases, where the standard of care may be highly variable and disease definitions may change rapidly, than for nonrare indications. In the United States, a rare disease is defined as a condition that affects fewer than 200,000 individuals, with most diseases presenting in children or being oncology indications. Advancements in precision medicine have changed the rare disease paradigm, with many common diseases now being considered rare diseases by further splitting into subdiseases or considering stratification by mutated genes in common cancers [<xref ref-type="bibr" rid="ref18">18</xref>]. Research focused on rare diseases is further challenged due to limited patient recruitment and siloed efforts focused on a singular therapeutic area [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref20">20</xref>]. Although common diseases and cancer indications are not safeguarded from similar complexities, they can often be more acute and rate limiting in the rare disease space. Regardless, both areas have their own unique technical challenges for researchers to broach throughout the life cycle of comparative efficacy analyses.</p>
        <p>Computational models from machine learning and artificial intelligence have experienced success in early disease diagnosis and trial recruitment across several indications [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref22">22</xref>]. Challenges in trial recruitment have led researchers to generate computational models for patient identification, but they have faced difficulties due to lengthy diagnosis procedures, multiple physicians, and lack of gold standard–confirmed diagnoses to train models [<xref ref-type="bibr" rid="ref23">23</xref>]. In scenarios where there is interest in rare diseases with a long disease course, these challenges can often be exacerbated due to the need for sufficient long-term follow-up data. Efforts to increase the use of data sharing in rare diseases, such as the use of FAIR (findable, accessible, interoperable, and reusable) Guiding Principles for implantation networks (eg, Global Open FAIR Implementation Network), aim to produce a conjoined effort to create data sources fit for translational research [<xref ref-type="bibr" rid="ref24">24</xref>]. In many instances, patient identification within EHRs begins with the use of existing standard terminologies, such as the International Classification of Diseases (ICD) and the Systematized Nomenclature of Medicine – Clinical Terms (SNOMED CT). For many common comorbidities, these coding strategies have been adopted into general administrative practice but have fallen short when classifying rare diseases. A study evaluating 6519 rare diseases considered the International Classification of Diseases, 9th Revision, Clinical Modification (ICD-9-CM), International Classification of Diseases, 10th Revision, Clinical Modification (ICD-10-CM), and SNOMED CT, and found varying levels of coverage matching to a unique rare disease at 62%, 73%, and 85%, respectively [<xref ref-type="bibr" rid="ref25">25</xref>]. With diseases being mapped to multiple ICD codes, a single representation may not constitute an accurate diagnosis. Increased coverage of rare diseases in coding languages has been acknowledged and incorporated in the International Classification of Diseases, 11th Revision (ICD-11) released in 2022, with 10 times more rare disease classifiers than the previous version [<xref ref-type="bibr" rid="ref26">26</xref>]. Additional challenges related to executing machine learning and artificial intelligence initiatives arise due to several ethical and legal concerns, including consent for data use, transparency of algorithms, liability, and cyber security [<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>]. Given the adaptive nature, the FDA has released guidance and a proposed regulatory framework, mainly in relation to medical devices and decision support software, to enable development of these technologies while maintaining safety and oversight for transparency and performance [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref30">30</xref>]. Equivalent guidance has yet to be established for similar initiatives involving comparative effectiveness studies using real-world data. Similarly, advanced procedures for the diagnosis of rare diseases, such as whole genome sequencing (WGS) and advanced imaging, may not be sufficiently captured within EHRs. Initiatives surrounding WGS in particular are being developed to improve the storage, knowledge, and presentation of genomic information within EHR systems to increase use [<xref ref-type="bibr" rid="ref31">31</xref>]. Despite the increase in coverage, the implementation of these coding strategies, conversion of previous ICD codes within EHR systems, and incorporation of advanced technologies will add an additional level of complexity for EHR-based studies.</p>
        <p>Outside of traditional rare diseases, adoption of real-world data for comparative efficacy remains underutilized in certain categories, such as the incorporation of medications or surgical procedures in clinical trial conduct [<xref ref-type="bibr" rid="ref32">32</xref>]. Similarly, the ability to replicate clinical trials based on real-world data alone continues to be an area to improve, as many replication failures can be attributed to analyzing endpoints not typically found in real-world data, requiring data that are unlikely to appear in a structured form, lack of complete medical history, or difficulties in closely emulating a placebo [<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref34">34</xref>]. From herein, we focus on the following common challenges: outcome and covariate challenges, follow-up, time selection, and geography.</p>
      </sec>
      <sec>
        <title>Outcome and Covariate Challenges</title>
        <p>In a traditional clinical trial, there are frameworks present for outcome ascertainment and frequency through defined protocols for the monitoring and timing of key observations to evaluate clinical effectiveness. Given the structured nature of data from RCTs, analyses using these are seldom hampered by high levels of missingness or stochastic outcome measurements. In the context of real-world data and external control arms, a common challenge encountered is addressing the mindset of researchers to be open to the value of real-world data and the ability to develop suitable outcome proxies due to insufficient data availability.</p>
        <p>EHR systems were not designed for use in the same structured trial environment for clinical effectiveness studies; therefore, additional steps are required to refine data sets for use. EHR data include routinely collected measurements from general practice, which may not exactly match defined clinical endpoints of interest or disease definitions as encountered in clinical trials. Accordingly, where analyses attempt to align these data for comparative efficacy, issues may arise. In these cases, plausible proxies need to be made. For example, a trial of interest in a hepatology setting might include an outcome for “ascites requiring treatment;” however, in EHR data sets, “ascites” might be captured, but the condition with the additional criteria of requiring treatment would not be preassembled and indexed. Indeed, it would be possible to generate the treatments for ascites and tie these back to an individual patient, but this may be a manual process. As such, estimating the total number of eligible patients with the outcome of interest may be subject to substantial manual data curation. Specifically, in the context of using EHRs for comparisons to data obtained from a prospective clinical trial, there may be an absence of overlapping outcomes. Clinical trials (randomized or single-arm) have been found to often capture data on outcomes not recorded routinely in clinical practice [<xref ref-type="bibr" rid="ref34">34</xref>].</p>
        <p>Similarly, the translation of many gold standard trial endpoints to real-world data initiatives may not always be a straightforward endeavor. These efforts require a series of methodological considerations during the planning, abstraction, and analysis phases to ensure regulatory-grade fit-for-purpose data [<xref ref-type="bibr" rid="ref35">35</xref>]. Even where data may be recorded and decisions made consistent with clinical trials, there may be differences with respect to the timing and process of testing, which may influence the availability of testing. In clinical trials of solid tumors, the Response Evaluation Criteria in Solid Tumors (RECIST) are often used to define endpoints of progression-free survival (PFS) or objective response. However, the ability to operationalize the RECIST for retrospective analysis can be hindered due to lack of consistency in imaging reports in community practices [<xref ref-type="bibr" rid="ref36">36</xref>]. The RECIST are partially qualitative measurements, and physicians or patients in clinical practice are not blinded to the treatment, providing another difference from a clinical trial environment. Where clinical trials may make assessments for progression on a scheduled basis, real-world settings often only do so when there is an indication of progression, generally resulting in a misalignment of timing when attempts are made to draw comparisons. The real-world equivalents of many clinical trial endpoints, such as PFS and objective response rate, may not be generated using the same level of standardization or may result in variations in assessment criteria between diagnosing physicians in comparison to when performed within a clinical trial setting. For indications with good survival, such as early stage breast cancer, surrogate endpoints have been influential in allowing for reduced development time, smaller patient populations, and shorter follow-up time [<xref ref-type="bibr" rid="ref37">37</xref>]. Surrogate endpoints, such as pathologic complete response, would require the same level of attention as long-term outcomes to adequately define a real-world equivalent. As many surrogate endpoints for topics, such as oncology, remain controversial due to questions over their direct correlation to assess patient survival, their applications from real-world data are subject to similar criticism [<xref ref-type="bibr" rid="ref38">38</xref>]. Real-world data–based surrogate endpoints require thorough validation and can often involve timely procedures to abstract adequate data for ascertainment [<xref ref-type="bibr" rid="ref39">39</xref>].</p>
        <p>Other endpoints of interest, such as overall survival, may be clearly definable within a given data set, but are subject to limitations such as use restriction, delayed data availability, and missingness [<xref ref-type="bibr" rid="ref40">40</xref>]. For example, in acute lymphoblastic leukemia, the concept of “fit-for-use” EHR data was evaluated by assessing the data suitability prior to examination of any survival-based outcomes [<xref ref-type="bibr" rid="ref41">41</xref>]. Using a defined data quality assessment framework, data variables, such as diagnoses and demographics, were extracted and defined from EHRs over 70% of the time, but the approach fell short when categorizing laboratory values and death data, resulting in a high degree of missingness for these variables [<xref ref-type="bibr" rid="ref41">41</xref>]. As such, when considering data missingness, it is important not to simply restrict the evaluation to availability versus nonavailability of data, but also consider the frequency of assessments and overall data suitability. While much of the current literature has focused on oncological examples and survival-based outcomes, similar considerations can be granted to other outcomes, such as adverse events, and assessment of the balance between efficacy and clinical benefit.</p>
      </sec>
      <sec>
        <title>Follow-up</title>
        <p>Real-world studies provide an opportunity to offer additional insights into the patient journey by providing a reflection of traditional care. In an RCT setting, long-term follow-up can be constrained by financial hurdles and trial logistics. To mitigate this, randomized trials have been extended by incorporating long-term follow-ups augmented using routinely collected health care data to investigate long-term outcomes [<xref ref-type="bibr" rid="ref42">42</xref>]. In these contexts, there may be somewhat broader observation windows than in traditional RCTs, and there are still predefined study visits, follow-up criteria, and study investigators ensuring consistency of follow-up. In contrast, patients in general practice demonstrate higher variability with respect to their follow-up times and their frequency of follow-up visits. Patients’ frequency of visits may be heavily correlated with the severity of their condition or diagnosis, resulting in potential biases for follow-up times. Specifically considering this in the context of time-to-event outcomes, imbalances in follow-up frequency can result in biased estimations of relative treatment effects [<xref ref-type="bibr" rid="ref43">43</xref>]. Empirically, this has been demonstrated with observational data, and showing the level of follow-up completeness has been influential in the accuracy of survival estimates [<xref ref-type="bibr" rid="ref44">44</xref>]. In this example, simple reporting standardization of study follow-up, including in general practice, was found to be influential in outcome assessments, with a lack of systematic follow-up resulting in an underestimation of mortality [<xref ref-type="bibr" rid="ref44">44</xref>]. Similarly, the frequency of assessment scans has been shown to be associated with higher median PFS for both treated and untreated populations [<xref ref-type="bibr" rid="ref45">45</xref>]. As such, where assessments of PFS are made using real-world data with low or high frequency of assessments relative to the comparator data, the potential for bias may be high. In addition to visit frequency, the United States has additional hurdles contributing to the lack of sufficient follow-up data due to clinicians experiencing a higher administrative burden when using EHR systems in comparison to other countries, discontinuity resulting from out-of-system care, and a direct relationship with enrollment in health care insurance [<xref ref-type="bibr" rid="ref46">46</xref>-<xref ref-type="bibr" rid="ref48">48</xref>]. The value of incorporating real-world data into a framework to be considered as evidence for future extension studies has been recognized and endorsed by agencies such as the International Society for Pharmacoepidemiology [<xref ref-type="bibr" rid="ref49">49</xref>].</p>
      </sec>
      <sec>
        <title>Time Selection Challenges</title>
        <p>Unlike in randomized controlled comparative efficacy studies, the definition of start date for measuring patient outcomes can be challenging in routinely collected health data. The concept of immortal time bias originated in the 1970s and is termed to account for the period of time within an observational or follow-up period of a cohort where the study outcome of interest cannot occur [<xref ref-type="bibr" rid="ref50">50</xref>]. When unaccounted for, EHR studies can be prone to immortal time bias, and this phenomenon has been demonstrated in observational studies of long-term conditions [<xref ref-type="bibr" rid="ref51">51</xref>]. For example, clinical trials may often be established to evaluate a therapy within a population having an existing therapeutic history, which is often referred to as a line of therapy. There may be limits with respect to the total lines of therapy, but they are otherwise permissive with respect to treatment lines or may even use treatment lines as a stratification factor. In routinely collected health data, this presents a challenge for patients with multiple lines of therapy, who are “multiply eligible” for the trial of interest. For a patient who has received 4 lines of therapy, which line of therapy should be considered their index date? Patients could be selected according to their most recent line of therapy or oldest line of therapy, or there could be a random selection of the therapy line. Each of these may have an influence on the associated outcomes, particularly those that may have a time-varying frequency. Hernan and Robins proposed several approaches within the context of target trial emulation. It has been proposed to use a single time zero, a randomly selected time zero, or all available time zeros for a given patient [<xref ref-type="bibr" rid="ref52">52</xref>]. Within the context of a comparative efficacy analysis using external trial data, these approaches may not be as interchangeable. Indeed, simulation-based research in an oncology context identified that the use of either random line selection or the last line of therapy was subject to substantial inflation in type I error when compared to the use of all available lines of therapy [<xref ref-type="bibr" rid="ref53">53</xref>]. As such, careful selection of the index date should be applied as decisions may substantially alter the associated inferences available.</p>
        <p>Related to these issues are those representing general temporal biases associated with discordant timeframes of interest. While statistical methodologies may be used to minimize observable between-group differences, other aspects of care may vary over time in ways that cannot be accounted for in such a direct manner. For example, even where diagnostic criteria for a condition do not vary over the time period of interest, access to the requisite diagnostic technology may increase over time, leading to increased disease incidence outside of any other changes to practice. These patients may differ from patients identified at different times with respect to both measurable and unmeasurable characteristics, which may contribute to temporal bias [<xref ref-type="bibr" rid="ref54">54</xref>]. This is separate from more clear-cut temporal bias, which may occur when diagnostic criteria change for patients, standards of care vary over time, or important prognostic factors of significance are identified, and it would need to be adequately accounted for. Finally, these changes in practice over time may result in essential covariates or populations of interest being simply unavailable owing to evolution of the standard of care.</p>
        <p>Indeed, concerns regarding temporal bias have formed the basis of negative reception in regulatory submissions using external data for the FDA, the EMA, and Health Canada [<xref ref-type="bibr" rid="ref55">55</xref>,<xref ref-type="bibr" rid="ref56">56</xref>]. Statistical approaches exist to identify time-varying confounding [<xref ref-type="bibr" rid="ref54">54</xref>], though these are predominantly for exploring the existence of such confounding, rather than to minimize their impact. As such, where possible, it is important to achieve close alignment with respect to the timeline of interest, and where this is not possible, it is important to identify covariates that may influence the differences in dates.</p>
      </sec>
      <sec>
        <title>Geographical Context</title>
        <p>Conditional on the circumstances associated with the application of an external control, geographic representation may be an important characteristic to consider. Regulatory and reimbursement bodies have often identified geographic discordance as part of the rationale behind negative endorsement of candidate products, particularly where these geographic differences are likely to translate to differences in prognostic factors, confounding, effect modifiers, and standards of care [<xref ref-type="bibr" rid="ref57">57</xref>]. Management of these issues can be minimized through ensuring specificity of the geographic source of the data of interest to ensure consistency with the target trial of interest. This may not be possible in all instances. Real-world data may be abundant in high-income countries (eg, countries in North America and Europe) but can be significantly lacking in many low- and middle-income countries due to lack of EHRs, agreement between stakeholders, and regulation to support the generation and use of secondary data [<xref ref-type="bibr" rid="ref58">58</xref>]. The commercialization of data from many high-income countries has made identification more attainable, but given that there is no organization dedicated to the tracking of sources in low- and middle-income countries, barriers remain for researchers to identify these sources with ease [<xref ref-type="bibr" rid="ref59">59</xref>]. Further compounding these issues is the substantial variations with respect to the availability of data in certain geographies owing to the varying legal frameworks associated with the use of patient data and differences in language. Efforts to address the ability to generalize study inferences outside of the intended study population of a geography to another is an emerging topic of interest known as transportability, and it has shown success under special circumstances [<xref ref-type="bibr" rid="ref60">60</xref>,<xref ref-type="bibr" rid="ref61">61</xref>]. Despite advancement, geography remains a concern for researchers to contend with when wanting to have sufficient population coverage across high- and low-income countries.</p>
      </sec>
    </sec>
    <sec>
      <title>Solutions: How Can Challenges Be Minimized?</title>
      <sec>
        <title>Solution 1: Transparent Prespecified Description of Data Element Definitions and a Detailed Data Analysis Plan</title>
        <p>The abundance of real-world data certainly presents a vast set of challenges, including “data dredging” where the hoped-for result may stem from ad hoc data mining or from selection of one of the many data sources with limited characteristics for adjustment [<xref ref-type="bibr" rid="ref62">62</xref>-<xref ref-type="bibr" rid="ref65">65</xref>]. With the large quantities of available real-world data across the United States and Europe, data sets can conceivably be stratified and matched in ways that could provide favorable results in an opaque manner. To mitigate this, solutions have been presented by regulatory bodies and academic groups for improving transparency for comparative efficacy exercises using real-world data. FDA guidance specifically calls out that study design elements, including data source definitions of all data elements and analyses, should be prespecified prior to analysis, and encourages groups submitting to partake in preanalysis discussions early in the drug development program about whether conducting an externally controlled trial instead of an RCT is reasonable [<xref ref-type="bibr" rid="ref7">7</xref>]. Academic groups, such as the International Society for Pharmacoeconomics and Outcomes Research (ISPOR) task force, also have guidance on good practices for real-world data studies of treatment effectiveness [<xref ref-type="bibr" rid="ref66">66</xref>]. The provided advice is to have a transparent and systematic review process of combing through the data source availability and matching to trial characteristics.</p>
        <p>The intended steps of using real-world data to evaluate clinical efficacy should be discussed or described in a protocol and statistical analysis plan (SAP) with the associated regulatory or reimbursement body ahead of initiating the externally controlled trial, in an effort to not “cherry pick” the results. Here, sponsors should include a justification for selecting or excluding relevant data sources and should demonstrate that the choice of the final data source for the control arm best answers the research question of interest [<xref ref-type="bibr" rid="ref7">7</xref>]. Further, it would be imperative to describe how the relevant EHR data were extracted and imported into the sponsor’s electronic system, and how the data obtained from EHRs are consistent with the data collection specified in the clinical trial protocol.</p>
        <p>FDA guidance specifies that the protocol and SAP that will be submitted following initial discussions should describe the data provenance curation and transformation procedures in the final study-specific analytic data set and describe how processes could affect data integrity (consistency of data and completeness) and overall study validity [<xref ref-type="bibr" rid="ref3">3</xref>]. Given the origin of real-world data, SAPs should also specify all proposed sensitivity analyses or quantitative bias analyses as suggested by FDA guidance documentation to address the influence of outcome misclassification and unmeasured confounders in order to ensure appropriate conclusions are drawn [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref7">7</xref>]. Taken together, prespecifying data source collection methods, data element availability, and data integrity to regulatory authorities before conducting any analyses can provide transparency regarding the upcoming efficacy analyses and provide a solution to data mining.</p>
        <p>One approach to doing this is to define the patient population for the external control arm, specify the outcome of interest, identify prognostic factors associated with the outcome of interest, and specify the control therapy. During the data source identification phase of the study, it may be common to undertake a scoping exercise to understand the breadth of data available and decipher top-level patient counts. From these selection criteria, data sets that do not have available data for elements of interest can be excluded. The derived top-level counts will reduce as further matching with trial selection criteria is applied. It is an iterative process to assess the best data source that will have sufficient patient counts and covariates to confirm a match, by assessing the strengths and limitations of each of these data sources simultaneously. Since the identification of a suitable real-world data database is an iterative process when proposing the external control arm to regulators at the time of filing for regulatory discussions, a prespecified description of the database is suggested to inform regulators, but a major limitation is that some data element criteria might be unknown until further exploration [<xref ref-type="bibr" rid="ref7">7</xref>]. Among included data sets, assessments may be made for sample size estimates of the closest resemblance to the effective population and data missingness. The data sets with the highest effective sample size and better coverage of data elements are considered for a feasibility assessment with a deeper look at the data. Through tokenization or other methodologies, multiple data sources could also be used to get more complete patient health care data, follow-up information, and geographic coverage.</p>
      </sec>
      <sec>
        <title>Solution 2: Data Collection Leveraging Real-World Data</title>
        <p>Situations where existing data are not available or suitable for an indication, a necessary exposure, an outcome, or a key covariate to measure confounding from sources, can pose a major limitation to conducting comparative efficacy studies to support regulatory decisions. As other researchers have stated, a common external control arm critique is about the mitigation of confounding [<xref ref-type="bibr" rid="ref16">16</xref>]. Unfortunately, there are limits to ascertain real-world data proxies for variables in historically collected databases. This could also be problematic when a group may wish to minimize temporal bias due to changes in the standard of care when using older data, by restricting the dates of eligible patients. This in turn could result in low sample sizes of well-matched control patients.</p>
        <p>A possible solution for these issues is to conduct de novo retrospective data collection where there would be manual review of patient charts, in conjunction with pre-existing data. Here, clinicians and key experts for the indication create a customized data collection form (also known as an electronic case record form) that can be standardized across multiple sites and gather useful details. In these scenarios, assessments can be obtained and linked directly to events of interest, such as a new medication or an annual physical examination. As EHR databases can provide access to longitudinal data, further evaluation of measures both before and after the event window can be performed. Drawing upon these aspects further emphasizes the value of real-world data to contribute to both predictive analytics and assessment of long-term outcomes in comparative effectiveness analyses.</p>
        <p>De novo data capture will not fix challenges in relation to the frequency of visits or collection of variables known to exist exclusively within trial settings, which is a limitation of this solution. However, qualitative assessments and clinical narratives can contain valuable insights absent from the structured data fields of EHRs. Improvements in advanced analytics and natural language processing have provided increased automation to abstract valuable clinical information from unstructured fields, which is traditionally time consuming. A direct comparison between machine learning review and chart-based review in the diagnosis of rheumatoid arthritis demonstrated the ability of the algorithm to identify patients with a strong overlap in disease classification criteria and baseline disease characteristics [<xref ref-type="bibr" rid="ref67">67</xref>]. On the contrary, missing data and poor data quality can introduce bias in automated methods, and variability in models can limit comparisons [<xref ref-type="bibr" rid="ref68">68</xref>,<xref ref-type="bibr" rid="ref69">69</xref>]. Commercial data providers have realized the potential of custom abstraction projects incorporating both manual and automated abstraction to increase the availability of data outside of structured fields, as well as algorithms to calculate real-world endpoints in product offerings.</p>
      </sec>
      <sec>
        <title>Solution 3: Record Linkage/Tokenization</title>
        <p>The ability to characterize the entire patient journey is critical to perform clinical effectiveness analyses using real-world data, though a complete picture of a patient’s medical health is often not available within a single data source. Patients who move in and out of health care networks could have their data omitted from analyses of single data sets. If this movement is related to the patient’s standard of care or access to treatment, the process can result in unintended biases in an analysis that is unable to account for these patient movements and missing data. A solution to the fragmentation of the patient journey and perspective could be to engage with data providers who tokenize their data set. In tokenized data sets, patient “tokens” or unique identifiers are assigned to link a patient within a given data source to assist identification in other separate real-world data sources, avoiding duplication while protecting patient privacy at the same time [<xref ref-type="bibr" rid="ref70">70</xref>]. Tokenization and record linkage can aid in this endeavor and have been recognized by regulators through inclusion in draft guidelines to provide considerations when performing data linkage to ensure a comprehensive data set, quantification of errors, and resolution of discrepancies [<xref ref-type="bibr" rid="ref3">3</xref>]. Similarly, initiatives have been developed to combine machine learning methodologies and tokenization to expand upon use for EHR analysis, while drawing attention to areas needing improvement in patient phenotyping or patient identification for research purposes [<xref ref-type="bibr" rid="ref71">71</xref>].</p>
        <p>Examples of the role of tokenization have been identified for broadening data sets to improve associations of testing with outcomes in diseases such as COVID-19 [<xref ref-type="bibr" rid="ref72">72</xref>,<xref ref-type="bibr" rid="ref73">73</xref>]. While these approaches may be applicable in select cases, it is important to note that not all data sources are capable of linking data due to privacy concerns regarding indirect personal data and data ownership, and additional challenges due to differences in language. These themes highlight the potential limitations that can arise when considering linkage and tokenization to aid in downstream analyses. In turn, this necessitates a flexible approach to data identification and consideration of which approaches of further data acquisition are available for a given project.</p>
      </sec>
    </sec>
    <sec>
      <title>Summary of Real-World Data Identification Challenges and Case Studies</title>
      <p>Every scenario in identifying a suitable real-world data source as an external control arm for comparative efficacy is unique. The solution of tokenization, for example, could work in some instances, but might not be appropriate in cases where complete coverage of data is available, though the definitions in the data set are poorly defined in the external data source. <xref ref-type="table" rid="table1">Table 1</xref> lists the challenges that frequently arise in these data landscaping exercises and summarizes some examples of solutions or case studies for further reading.</p>
      <table-wrap position="float" id="table1">
        <label>Table 1</label>
        <caption>
          <p>Summary of real-world data identification for comparative efficacy using externally controlled trial challenges, examples, and application of solutions.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="30"/>
          <col width="270"/>
          <col width="0"/>
          <col width="360"/>
          <col width="0"/>
          <col width="340"/>
          <thead>
            <tr valign="top">
              <td colspan="3">Challenges</td>
              <td colspan="2">Examples</td>
              <td>Application of solutions</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td colspan="5">
                <bold>Data source identification of rare conditions</bold>
              </td>
              <td>
                <break/>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Indecision gaps due to abundance of real-world data</td>
              <td colspan="2">It is difficult to parse out important data sources, rare disease candidates, and data linkage options.</td>
              <td colspan="2">Machine learning applications can improve accuracy and quality (type and frequency) in data source selection and patient selection [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref67">67</xref>,<xref ref-type="bibr" rid="ref71">71</xref>]</td>
            </tr>
            <tr valign="top">
              <td colspan="3">
                <bold>Outcome and covariate</bold>
              </td>
              <td colspan="2">
                <break/>
              </td>
              <td>
                <break/>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Poorly defined variables or inconsistent definitions from clinical trial to real-world data for limited comparability of real-world data</td>
              <td colspan="2">The conceptual definition of a data element does not align with the operational definition.</td>
              <td colspan="2">
                <list list-type="bullet">
                  <list-item>
                    <p>De novo data collection [<xref ref-type="bibr" rid="ref74">74</xref>]</p>
                  </list-item>
                  <list-item>
                    <p>Automated electronic health record (EHR) abstraction [<xref ref-type="bibr" rid="ref69">69</xref>]</p>
                  </list-item>
                  <list-item>
                    <p>Characterization of real-world variables or surrogate endpoints [<xref ref-type="bibr" rid="ref75">75</xref>]</p>
                  </list-item>
                  <list-item>
                    <p>Prespecify sensitivity analyses, including quantitative bias analyses [<xref ref-type="bibr" rid="ref76">76</xref>], in the statistical analysis plan</p>
                  </list-item>
                </list>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Medical claims data might have limited use to support regulatory-grade decision-making</td>
              <td colspan="2">Claims data have limited clinical outcome data.</td>
              <td colspan="2">Combine with EHRs to expand the applicability, coverage, and depth of data [<xref ref-type="bibr" rid="ref77">77</xref>]</td>
            </tr>
            <tr valign="top">
              <td colspan="3">
                <bold>Follow-up</bold>
              </td>
              <td colspan="2">
                <break/>
              </td>
              <td>
                <break/>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Difficult to capture continuity of care in a single data source</td>
              <td colspan="2">Diagnosis is spread across multiple physicians; if the patient moves and seeks care outside of the care network, follow-up data will be lost.</td>
              <td colspan="2">
                <list list-type="bullet">
                  <list-item>
                    <p>Tokenization/data linkage and advanced analytics with EHR data for capturing a more complete patient journey (particularly helpful for rare conditions where the sample size would be low) [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref71">71</xref>]</p>
                  </list-item>
                  <list-item>
                    <p>Analytical approaches (ie, imputation) for missing data [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref71">71</xref>,<xref ref-type="bibr" rid="ref78">78</xref>]</p>
                  </list-item>
                </list>
              </td>
            </tr>
            <tr valign="top">
              <td colspan="3">
                <bold>Time selection</bold>
              </td>
              <td colspan="2">
                <break/>
              </td>
              <td>
                <break/>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Timing of therapy</td>
              <td colspan="2">Patient has multiple lines of treatment; what should be considered the index date?</td>
              <td colspan="2">Define a proper index date or “time zero” following the target trial emulation framework [<xref ref-type="bibr" rid="ref52">52</xref>]</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Timing of data collection – inconsistent standard of care over time</td>
              <td colspan="2">Data may be present, but are not current enough to provide a reasonable comparison to the current standard of care.</td>
              <td colspan="2">
                <list list-type="bullet">
                  <list-item>
                    <p>De novo data collection [<xref ref-type="bibr" rid="ref55">55</xref>]</p>
                  </list-item>
                  <list-item>
                    <p>Tokenization/data linkage [<xref ref-type="bibr" rid="ref78">78</xref>]</p>
                  </list-item>
                </list>
              </td>
            </tr>
            <tr valign="top">
              <td colspan="3">
                <bold>Geography</bold>
              </td>
              <td colspan="2">
                <break/>
              </td>
              <td>
                <break/>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>External control arm nongeneralizable to clinical practice</td>
              <td colspan="2">Geographic representation where the main external control arm data source is from outside of the country of interest. Select two unlinked data sources with available data to obtain a sufficient sample size. However, it is unclear if patients overlap in care networks.</td>
              <td colspan="2">
                <list list-type="bullet">
                  <list-item>
                    <p>Tokenization/data linkage, which improves patient counts with geographic representation while accounting for duplicates [<xref ref-type="bibr" rid="ref79">79</xref>]</p>
                  </list-item>
                  <list-item>
                    <p>Transportability [<xref ref-type="bibr" rid="ref60">60</xref>]</p>
                  </list-item>
                </list>
              </td>
            </tr>
            <tr valign="top">
              <td colspan="3">
                <bold>Analysis phase</bold>
              </td>
              <td colspan="2">
                <break/>
              </td>
              <td>
                <break/>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Data loss or insufficient sample size to detect power</td>
              <td colspan="2">In the analysis phase, during matching, the power to detect an effect is reduced.</td>
              <td colspan="2">
                <list list-type="bullet">
                  <list-item>
                    <p>De novo data collection [<xref ref-type="bibr" rid="ref55">55</xref>]</p>
                  </list-item>
                  <list-item>
                    <p>Tokenization/data linkage [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref44">44</xref>]</p>
                  </list-item>
                  <list-item>
                    <p>Analytical approaches (ie, imputation) for missing data [<xref ref-type="bibr" rid="ref78">78</xref>]</p>
                  </list-item>
                </list>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Avoid the appearance of the analysis as post-hoc or cherry picked</td>
              <td colspan="2">Data dredging/post-hoc analysis (eg, regulators can assume the most appealing analysis was conducted).</td>
              <td colspan="2">Transparent prespecified description of data selection, data provenance, and the statistical analysis plan [<xref ref-type="bibr" rid="ref3">3</xref>]</td>
            </tr>
          </tbody>
        </table>
      </table-wrap>
    </sec>
    <sec>
      <title>Conclusion</title>
      <p>Given the considerable costs of novel drug development pipelines and the increasing stratification of diseases and subtypes, real-world data will become increasingly relevant for regulatory and reimbursement discussions in the decades to come. Exclusive reliance on an RCT framework as the entire evidence generation plan does not adequately acknowledge the shortcomings of a singular research strategy, despite the advantages for comparative efficacy research. Simultaneously, the field of biostatistics has expanded to focus on data missingness to allow effectiveness analyses when a subject presents with incomplete data, while taking the necessary precautions and accounting for bias.</p>
      <p>The versatility of the use of real-world data extends beyond its use in comparative efficacy analyses. There are additional concerns with safety, which have postmarket authorization requirement differences. Similarly, important topics outside the scope of this paper include the many challenges associated with patient privacy and reidentification risk, and the necessary consideration needed when performing these analyses. EHR-based real-world data were the focus of this paper, but additional sources have been successful in comparative efficacy analyses. Claims, like other sources of real-world data, have their own unique challenges for consideration [<xref ref-type="bibr" rid="ref80">80</xref>], but have demonstrated success in clinical effectiveness studies and in rare disease studies [<xref ref-type="bibr" rid="ref77">77</xref>,<xref ref-type="bibr" rid="ref81">81</xref>,<xref ref-type="bibr" rid="ref82">82</xref>]. Conjoined efforts, such as those between the ISPOR and the International Society for Pharmaceutical Engineering, have provided recommendations to highlight the need for transparency in planning and reporting of observational real-world evidence studies and comparative effectiveness studies [<xref ref-type="bibr" rid="ref66">66</xref>]. Although real-world evidence based on real-world data studies is critical to the operation of providing timely insights into what works for patients and when, the identification and evaluation of real-world data sources for comparative effectiveness studies have many challenges. The solutions suggested in this paper could minimize these challenges; however, the selection and evaluation of a good real-world data source is not as straightforward as it may appear.</p>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">EHR</term>
          <def>
            <p>electronic health record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">EMA</term>
          <def>
            <p>European Medicines Agency</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">FAIR</term>
          <def>
            <p>findable, accessible, interoperable, and reusable</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">FDA</term>
          <def>
            <p>Food and Drug Administration</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">ICD</term>
          <def>
            <p>International Classification of Diseases</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">ISPOR</term>
          <def>
            <p>International Society for Pharmacoeconomics and Outcomes Research</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">PFS</term>
          <def>
            <p>progression-free survival</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">RCT</term>
          <def>
            <p>randomized controlled trial</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">RECIST</term>
          <def>
            <p>Response Evaluation Criteria in Solid Tumors</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">SAP</term>
          <def>
            <p>statistical analysis plan</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">SNOMED CT</term>
          <def>
            <p>Systematized Nomenclature of Medicine – Clinical Terms</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">WGS</term>
          <def>
            <p>whole genome sequencing</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <fn-group>
      <fn fn-type="conflict">
        <p>RRV, CM, and LD work for Cytel Inc (paid employment). RRV and LD have shares of Cytel Inc. EAS and LE work for Nashville Biosciences (paid employment). DRB has no conflicts to declare.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mahendraratnam</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Mercon</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Gill</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Benzing</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>McClellan</surname>
              <given-names>MB</given-names>
            </name>
          </person-group>
          <article-title>Understanding Use of Real-World Data and Real-World Evidence to Support Regulatory Decisions on Medical Product Effectiveness</article-title>
          <source>Clin Pharmacol Ther</source>
          <year>2022</year>
          <month>01</month>
          <volume>111</volume>
          <issue>1</issue>
          <fpage>150</fpage>
          <lpage>154</lpage>
          <pub-id pub-id-type="doi">10.1002/cpt.2272</pub-id>
          <pub-id pub-id-type="medline">33891318</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gabay</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>21st Century Cures Act</article-title>
          <source>Hosp Pharm</source>
          <year>2017</year>
          <month>04</month>
          <volume>52</volume>
          <issue>4</issue>
          <fpage>264</fpage>
          <lpage>265</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/28515504"/>
          </comment>
          <pub-id pub-id-type="doi">10.1310/hpj5204-264</pub-id>
          <pub-id pub-id-type="medline">28515504</pub-id>
          <pub-id pub-id-type="pmcid">PMC5424829</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="web">
          <article-title>Real-World Data: Assessing Electronic Health Records and Medical Claims Data To Support Regulatory Decision-Making for Drug and Biological Products - Draft Guidance for Industry</article-title>
          <source>Food and Drug Administration</source>
          <access-date>2023-02-27</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.fda.gov/regulatory-information/search-fda-guidance-documents/real-world-data-assessing-electronic-health-records-and-medical-claims-data-support-regulatory">https://www.fda.gov/regulatory-information/search-fda-guidance-documents/real-world-data-assessing-electronic-health-records-and-medical-claims-data-support-regulatory</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="web">
          <article-title>CHMP Guideline on registry-based studies</article-title>
          <source>European Medicines Agency</source>
          <access-date>2023-02-27</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.encepp.eu/publications/documents/3_KellyPlueschke_CHMPGuidelineonregistry-basedstudies.pdf">https://www.encepp.eu/publications/documents/3_KellyPlueschke_CHMPGuidelineonregistry-basedstudies.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="web">
          <article-title>NICE real-world evidence framework</article-title>
          <source>National Institute for Health and Care Excellence</source>
          <access-date>2023-02-27</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.nice.org.uk/corporate/ecd9/chapter/overview">https://www.nice.org.uk/corporate/ecd9/chapter/overview</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="web">
          <article-title>E10 Choice of Control Group and Related Issues in Clinical Trials</article-title>
          <source>ICH Expert Working Group</source>
          <year>2000</year>
          <month>07</month>
          <day>20</day>
          <access-date>2023-02-27</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://database.ich.org/sites/default/files/E10_Guideline.pdf">https://database.ich.org/sites/default/files/E10_Guideline.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="web">
          <article-title>Considerations for the Design and Conduct of Externally Controlled Trials for Drug and Biological Products</article-title>
          <source>Food and Drug Administration</source>
          <access-date>2023-02-27</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.fda.gov/regulatory-information/search-fda-guidance-documents/considerations-design-and-conduct-externally-controlled-trials-drug-and-biological-products">https://www.fda.gov/regulatory-information/search-fda-guidance-documents/considerations-design-and-conduct-externally-controlled-trials-drug-and-biological-products</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="web">
          <article-title>Use of Electronic Health Record Data in Clinical Investigations Guidance for Industry</article-title>
          <source>Food and Drug Administration</source>
          <access-date>2023-02-27</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.fda.gov/regulatory-information/search-fda-guidance-documents/use-electronic-health-record-data-clinical-investigations-guidance-industry">https://www.fda.gov/regulatory-information/search-fda-guidance-documents/use-electronic-health-record-data-clinical-investigations-guidance-industry</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Maruszczyk</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Aiyegbusi</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Cardoso</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Gkoutos</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Slater</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Collis</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Keeley</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Calvert</surname>
              <given-names>MJ</given-names>
            </name>
          </person-group>
          <article-title>Implementation of patient-reported outcome measures in real-world evidence studies: Analysis of ClinicalTrials.gov records (1999-2021)</article-title>
          <source>Contemp Clin Trials</source>
          <year>2022</year>
          <month>09</month>
          <volume>120</volume>
          <fpage>106882</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1551-7144(22)00208-7"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.cct.2022.106882</pub-id>
          <pub-id pub-id-type="medline">35973663</pub-id>
          <pub-id pub-id-type="pii">S1551-7144(22)00208-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huhn</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Matzke</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Koch</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gunga</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Maggioni</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Sié</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Boudo</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Ouedraogo</surname>
              <given-names>WA</given-names>
            </name>
            <name name-style="western">
              <surname>Compaoré</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Bunker</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sauerborn</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Bärnighausen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Barteit</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Using wearable devices to generate real-world, individual-level data in rural, low-resource contexts in Burkina Faso, Africa: A case study</article-title>
          <source>Front Public Health</source>
          <year>2022</year>
          <month>9</month>
          <day>30</day>
          <volume>10</volume>
          <fpage>972177</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://air.unimi.it/handle/2434/941740"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fpubh.2022.972177</pub-id>
          <pub-id pub-id-type="medline">36249225</pub-id>
          <pub-id pub-id-type="pmcid">PMC9561896</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Barrett</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Leonardi</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Roychoudhury</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Trifillis</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Natural History and Real-World Data in Rare Diseases: Applications, Limitations, and Future Perspectives</article-title>
          <source>J Clin Pharmacol</source>
          <year>2022</year>
          <month>12</month>
          <volume>62 Suppl 2</volume>
          <fpage>S38</fpage>
          <lpage>S55</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1002/jcph.2134"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/jcph.2134</pub-id>
          <pub-id pub-id-type="medline">36461748</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Baumfeld Andre</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Reynolds</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Caubel</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Azoulay</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Dreyer</surname>
              <given-names>NA</given-names>
            </name>
          </person-group>
          <article-title>Trial designs using real-world data: The changing landscape of the regulatory approval process</article-title>
          <source>Pharmacoepidemiol Drug Saf</source>
          <year>2020</year>
          <month>10</month>
          <volume>29</volume>
          <issue>10</issue>
          <fpage>1201</fpage>
          <lpage>1212</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31823482"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/pds.4932</pub-id>
          <pub-id pub-id-type="medline">31823482</pub-id>
          <pub-id pub-id-type="pmcid">PMC7687110</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ghadessi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Toyoizumi</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Mei</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Deng</surname>
              <given-names>CQ</given-names>
            </name>
            <name name-style="western">
              <surname>Beckman</surname>
              <given-names>RA</given-names>
            </name>
          </person-group>
          <article-title>A roadmap to using historical controls in clinical trials - by Drug Information Association Adaptive Design Scientific Working Group (DIA-ADSWG)</article-title>
          <source>Orphanet J Rare Dis</source>
          <year>2020</year>
          <month>03</month>
          <day>12</day>
          <volume>15</volume>
          <issue>1</issue>
          <fpage>69</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ojrd.biomedcentral.com/articles/10.1186/s13023-020-1332-x"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s13023-020-1332-x</pub-id>
          <pub-id pub-id-type="medline">32164754</pub-id>
          <pub-id pub-id-type="pii">10.1186/s13023-020-1332-x</pub-id>
          <pub-id pub-id-type="pmcid">PMC7069184</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Evans</surname>
              <given-names>RS</given-names>
            </name>
          </person-group>
          <article-title>Electronic Health Records: Then, Now, and in the Future</article-title>
          <source>Yearb Med Inform</source>
          <year>2016</year>
          <month>05</month>
          <day>20</day>
          <volume>Suppl 1</volume>
          <issue>Suppl 1</issue>
          <fpage>S48</fpage>
          <lpage>61</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.thieme-connect.com/DOI/DOI?10.15265/IYS-2016-s006"/>
          </comment>
          <pub-id pub-id-type="doi">10.15265/IYS-2016-s006</pub-id>
          <pub-id pub-id-type="medline">27199197</pub-id>
          <pub-id pub-id-type="pii">me2016-s006</pub-id>
          <pub-id pub-id-type="pmcid">PMC5171496</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rahal</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Mercer</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kuziemsky</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Yaya</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Factors affecting the mature use of electronic medical records by primary care physicians: a systematic review</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2021</year>
          <month>02</month>
          <day>19</day>
          <volume>21</volume>
          <issue>1</issue>
          <fpage>67</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-021-01434-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-021-01434-9</pub-id>
          <pub-id pub-id-type="medline">33607986</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-021-01434-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC7893965</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jaksa</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Louder</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Maksymiuk</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Vondeling</surname>
              <given-names>GT</given-names>
            </name>
            <name name-style="western">
              <surname>Martin</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Gatto</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Richards</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Yver</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rosenlund</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>A Comparison of Seven Oncology External Control Arm Case Studies: Critiques From Regulatory and Health Technology Assessment Agencies</article-title>
          <source>Value Health</source>
          <year>2022</year>
          <month>12</month>
          <volume>25</volume>
          <issue>12</issue>
          <fpage>1967</fpage>
          <lpage>1976</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1098-3015(22)02004-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jval.2022.05.016</pub-id>
          <pub-id pub-id-type="medline">35760714</pub-id>
          <pub-id pub-id-type="pii">S1098-3015(22)02004-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>RO</given-names>
            </name>
            <name name-style="western">
              <surname>McCowan</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Montgomery</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Fahey</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>The external validity of published randomized controlled trials in primary care</article-title>
          <source>BMC Fam Pract</source>
          <year>2009</year>
          <month>01</month>
          <day>19</day>
          <volume>10</volume>
          <fpage>5</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcfampract.biomedcentral.com/articles/10.1186/1471-2296-10-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1471-2296-10-5</pub-id>
          <pub-id pub-id-type="medline">19152681</pub-id>
          <pub-id pub-id-type="pii">1471-2296-10-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC2632986</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chung</surname>
              <given-names>BHY</given-names>
            </name>
            <name name-style="western">
              <surname>Chau</surname>
              <given-names>JFT</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>GK</given-names>
            </name>
          </person-group>
          <article-title>Rare versus common diseases: a false dichotomy in precision medicine</article-title>
          <source>NPJ Genom Med</source>
          <year>2021</year>
          <month>02</month>
          <day>24</day>
          <volume>6</volume>
          <issue>1</issue>
          <fpage>19</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41525-021-00176-x"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41525-021-00176-x</pub-id>
          <pub-id pub-id-type="medline">33627657</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41525-021-00176-x</pub-id>
          <pub-id pub-id-type="pmcid">PMC7904920</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Halley</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>HS</given-names>
            </name>
            <name name-style="western">
              <surname>Ashley</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Goldenberg</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Tabor</surname>
              <given-names>HK</given-names>
            </name>
          </person-group>
          <article-title>A call for an integrated approach to improve efficiency, equity and sustainability in rare disease research in the United States</article-title>
          <source>Nat Genet</source>
          <year>2022</year>
          <month>03</month>
          <day>07</day>
          <volume>54</volume>
          <issue>3</issue>
          <fpage>219</fpage>
          <lpage>222</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35256804"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41588-022-01027-w</pub-id>
          <pub-id pub-id-type="medline">35256804</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41588-022-01027-w</pub-id>
          <pub-id pub-id-type="pmcid">PMC9016354</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kempf</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Goldsmith</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Temple</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Challenges of developing and conducting clinical trials in rare disorders</article-title>
          <source>Am J Med Genet A</source>
          <year>2018</year>
          <month>04</month>
          <volume>176</volume>
          <issue>4</issue>
          <fpage>773</fpage>
          <lpage>783</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1002/ajmg.a.38413"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/ajmg.a.38413</pub-id>
          <pub-id pub-id-type="medline">28815894</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Hogan</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Shenkman</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Bian</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Applications of artificial intelligence in drug development using real-world data</article-title>
          <source>Drug Discov Today</source>
          <year>2021</year>
          <month>05</month>
          <volume>26</volume>
          <issue>5</issue>
          <fpage>1256</fpage>
          <lpage>1264</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33358699"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.drudis.2020.12.013</pub-id>
          <pub-id pub-id-type="medline">33358699</pub-id>
          <pub-id pub-id-type="pii">S1359-6446(20)30531-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC8626864</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kumar</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Koul</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Singla</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Ijaz</surname>
              <given-names>MF</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence in disease diagnosis: a systematic literature review, synthesizing framework and future research agenda</article-title>
          <source>J Ambient Intell Humaniz Comput</source>
          <year>2022</year>
          <month>01</month>
          <day>13</day>
          <fpage>1</fpage>
          <lpage>28</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35039756"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s12652-021-03612-z</pub-id>
          <pub-id pub-id-type="medline">35039756</pub-id>
          <pub-id pub-id-type="pii">3612</pub-id>
          <pub-id pub-id-type="pmcid">PMC8754556</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Colbaugh</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Glass</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Rudolf</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Tremblay Volv Global Lausanne Switzerland</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Learning to Identify Rare Disease Patients from Electronic Health Records</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2018</year>
          <volume>2018</volume>
          <fpage>340</fpage>
          <lpage>347</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/30815073"/>
          </comment>
          <pub-id pub-id-type="medline">30815073</pub-id>
          <pub-id pub-id-type="pmcid">PMC6371307</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wilkinson</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Dumontier</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Aalbersberg</surname>
              <given-names>IJ</given-names>
            </name>
            <name name-style="western">
              <surname>Appleton</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Axton</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Baak</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Blomberg</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Boiten</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>da Silva Santos</surname>
              <given-names>LB</given-names>
            </name>
            <name name-style="western">
              <surname>Bourne</surname>
              <given-names>PE</given-names>
            </name>
            <name name-style="western">
              <surname>Bouwman</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Brookes</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Clark</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Crosas</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dillo</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Dumon</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Edmunds</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Evelo</surname>
              <given-names>CT</given-names>
            </name>
            <name name-style="western">
              <surname>Finkers</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Gonzalez-Beltran</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gray</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Groth</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Goble</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Grethe</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Heringa</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>'t Hoen</surname>
              <given-names>PAC</given-names>
            </name>
            <name name-style="western">
              <surname>Hooft</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Kuhn</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Kok</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Kok</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lusher</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Martone</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Mons</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Packer</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Persson</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Rocca-Serra</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Roos</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>van Schaik</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Sansone</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Schultes</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Sengstag</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Slater</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Strawn</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Swertz</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Thompson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>van der Lei</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>van Mulligen</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Velterop</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Waagmeester</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wittenburg</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Wolstencroft</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Mons</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>The FAIR Guiding Principles for scientific data management and stewardship</article-title>
          <source>Sci Data</source>
          <year>2016</year>
          <month>03</month>
          <day>15</day>
          <volume>3</volume>
          <issue>1</issue>
          <fpage>160018</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/sdata.2016.18"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/sdata.2016.18</pub-id>
          <pub-id pub-id-type="medline">26978244</pub-id>
          <pub-id pub-id-type="pii">sdata201618</pub-id>
          <pub-id pub-id-type="pmcid">PMC4792175</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fung</surname>
              <given-names>KW</given-names>
            </name>
            <name name-style="western">
              <surname>Richesson</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Bodenreider</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <article-title>Coverage of rare disease names in standard terminologies and implications for patients, providers, and research</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2014</year>
          <volume>2014</volume>
          <fpage>564</fpage>
          <lpage>72</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/25954361"/>
          </comment>
          <pub-id pub-id-type="medline">25954361</pub-id>
          <pub-id pub-id-type="pmcid">PMC4419993</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Aymé</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bellet</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Rath</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Rare diseases in ICD11: making rare diseases visible in health information systems through appropriate coding</article-title>
          <source>Orphanet J Rare Dis</source>
          <year>2015</year>
          <month>03</month>
          <day>26</day>
          <volume>10</volume>
          <fpage>35</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ojrd.biomedcentral.com/articles/10.1186/s13023-015-0251-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s13023-015-0251-8</pub-id>
          <pub-id pub-id-type="medline">25887186</pub-id>
          <pub-id pub-id-type="pii">10.1186/s13023-015-0251-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC4377208</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gerke</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Minssen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Bohr</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Memarzadeh</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Chapter 12 - Ethical and legal challenges of artificial intelligence-driven healthcare</article-title>
          <source>Artificial Intelligence in Healthcare</source>
          <year>2020</year>
          <publisher-loc>Cambridge, MA</publisher-loc>
          <publisher-name>Academic Press</publisher-name>
          <fpage>295</fpage>
          <lpage>336</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>He</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Baxter</surname>
              <given-names>SL</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>The practical implementation of artificial intelligence technologies in medicine</article-title>
          <source>Nat Med</source>
          <year>2019</year>
          <month>01</month>
          <volume>25</volume>
          <issue>1</issue>
          <fpage>30</fpage>
          <lpage>36</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/30617336"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41591-018-0307-0</pub-id>
          <pub-id pub-id-type="medline">30617336</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41591-018-0307-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC6995276</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="web">
          <article-title>Clinical Decision Support Software - Guidance for Industry and Food and Drug Administration Staff</article-title>
          <source>Food and Drug Administration</source>
          <access-date>2023-02-27</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.fda.gov/regulatory-information/search-fda-guidance-documents/clinical-decision-support-software">https://www.fda.gov/regulatory-information/search-fda-guidance-documents/clinical-decision-support-software</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="web">
          <article-title>Proposed Regulatory Framework for Modifications to Artificial Intelligence/Machine Learning (AI/ML)-Based Software as a Medical Device (SaMD) - Discussion Paper and Request for Feedback</article-title>
          <source>Food and Drug Administration</source>
          <access-date>2023-02-27</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.fda.gov/files/medical%20devices/published/US-FDA-Artificial-Intelligence-and-Machine-Learning-Discussion-Paper.pdf">https://www.fda.gov/files/medical%20devices/published/US-FDA-Artificial-Intelligence-and-Machine-Learning-Discussion-Paper.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Taylor</surname>
              <given-names>CO</given-names>
            </name>
            <name name-style="western">
              <surname>Walton</surname>
              <given-names>NA</given-names>
            </name>
            <name name-style="western">
              <surname>Goehringer</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Aronson</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Freimuth</surname>
              <given-names>RR</given-names>
            </name>
            <name name-style="western">
              <surname>Rasmussen</surname>
              <given-names>LV</given-names>
            </name>
            <name name-style="western">
              <surname>Hall</surname>
              <given-names>ES</given-names>
            </name>
            <name name-style="western">
              <surname>Prows</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Chung</surname>
              <given-names>WK</given-names>
            </name>
            <name name-style="western">
              <surname>Fedotov</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Nestor</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Rowley</surname>
              <given-names>RK</given-names>
            </name>
            <name name-style="western">
              <surname>Wiesner</surname>
              <given-names>GL</given-names>
            </name>
            <name name-style="western">
              <surname>Jarvik</surname>
              <given-names>GP</given-names>
            </name>
            <name name-style="western">
              <surname>Del Fiol</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Genomic Information for Clinicians in the Electronic Health Record: Lessons Learned From the Clinical Genome Resource Project and the Electronic Medical Records and Genomics Network</article-title>
          <source>Front Genet</source>
          <year>2019</year>
          <month>10</month>
          <day>29</day>
          <volume>10</volume>
          <fpage>1059</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31737042"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fgene.2019.01059</pub-id>
          <pub-id pub-id-type="medline">31737042</pub-id>
          <pub-id pub-id-type="pmcid">PMC6830110</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rogers</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Cheung</surname>
              <given-names>YK</given-names>
            </name>
            <name name-style="western">
              <surname>Hripcsak</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Contemporary use of real-world data for clinical trial conduct in the United States: a scoping review</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2021</year>
          <month>01</month>
          <day>15</day>
          <volume>28</volume>
          <issue>1</issue>
          <fpage>144</fpage>
          <lpage>154</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33164065"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocaa224</pub-id>
          <pub-id pub-id-type="medline">33164065</pub-id>
          <pub-id pub-id-type="pii">5961445</pub-id>
          <pub-id pub-id-type="pmcid">PMC7810452</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bartlett</surname>
              <given-names>VL</given-names>
            </name>
            <name name-style="western">
              <surname>Dhruva</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>ND</given-names>
            </name>
            <name name-style="western">
              <surname>Ryan</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Ross</surname>
              <given-names>JS</given-names>
            </name>
          </person-group>
          <article-title>Feasibility of Using Real-World Data to Replicate Clinical Trial Evidence</article-title>
          <source>JAMA Netw Open</source>
          <year>2019</year>
          <month>10</month>
          <day>02</day>
          <volume>2</volume>
          <issue>10</issue>
          <fpage>e1912869</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31596493"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jamanetworkopen.2019.12869</pub-id>
          <pub-id pub-id-type="medline">31596493</pub-id>
          <pub-id pub-id-type="pii">2752575</pub-id>
          <pub-id pub-id-type="pmcid">PMC6802419</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zarbin</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Real Life Outcomes vs. Clinical Trial Results</article-title>
          <source>J Ophthalmic Vis Res</source>
          <year>2019</year>
          <volume>14</volume>
          <issue>1</issue>
          <fpage>88</fpage>
          <lpage>92</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.jovr.org/article.asp?issn=2008-322X;year=2019;volume=14;issue=1;spage=88;epage=92;aulast=Zarbin"/>
          </comment>
          <pub-id pub-id-type="doi">10.4103/jovr.jovr_279_18</pub-id>
          <pub-id pub-id-type="medline">30820292</pub-id>
          <pub-id pub-id-type="pii">JOVR-14-88</pub-id>
          <pub-id pub-id-type="pmcid">PMC6388532</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Miksad</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Abernethy</surname>
              <given-names>AP</given-names>
            </name>
          </person-group>
          <article-title>Harnessing the Power of Real-World Evidence (RWE): A Checklist to Ensure Regulatory-Grade Data Quality</article-title>
          <source>Clin Pharmacol Ther</source>
          <year>2018</year>
          <month>02</month>
          <volume>103</volume>
          <issue>2</issue>
          <fpage>202</fpage>
          <lpage>205</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/29214638"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/cpt.946</pub-id>
          <pub-id pub-id-type="medline">29214638</pub-id>
          <pub-id pub-id-type="pmcid">PMC5814721</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Griffith</surname>
              <given-names>SD</given-names>
            </name>
            <name name-style="western">
              <surname>Tucker</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bowser</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Calkins</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Guardino</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Khozin</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kraut</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>You</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Schrag</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Miksad</surname>
              <given-names>RA</given-names>
            </name>
          </person-group>
          <article-title>Generating Real-World Tumor Burden Endpoints from Electronic Health Record Data: Comparison of RECIST, Radiology-Anchored, and Clinician-Anchored Approaches for Abstracting Real-World Progression in Non-Small Cell Lung Cancer</article-title>
          <source>Adv Ther</source>
          <year>2019</year>
          <month>08</month>
          <volume>36</volume>
          <issue>8</issue>
          <fpage>2122</fpage>
          <lpage>2136</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31140124"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s12325-019-00970-1</pub-id>
          <pub-id pub-id-type="medline">31140124</pub-id>
          <pub-id pub-id-type="pii">10.1007/s12325-019-00970-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC6822856</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gion</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pérez-García</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Llombart-Cussac</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sampayo-Cordero</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cortés</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Malfettone</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Surrogate endpoints for early-stage breast cancer: a review of the state of the art, controversies, and future prospects</article-title>
          <source>Ther Adv Med Oncol</source>
          <year>2021</year>
          <volume>13</volume>
          <fpage>17588359211059587</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://journals.sagepub.com/doi/10.1177/17588359211059587?url_ver=Z39.88-2003&#38;rfr_id=ori:rid:crossref.org&#38;rfr_dat=cr_pub  0pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/17588359211059587</pub-id>
          <pub-id pub-id-type="medline">34868353</pub-id>
          <pub-id pub-id-type="pii">10.1177_17588359211059587</pub-id>
          <pub-id pub-id-type="pmcid">PMC8640314</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Korn</surname>
              <given-names>EL</given-names>
            </name>
            <name name-style="western">
              <surname>Sachs</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>McShane</surname>
              <given-names>LM</given-names>
            </name>
          </person-group>
          <article-title>Statistical controversies in clinical research: assessing pathologic complete response as a trial-level surrogate end point for early-stage breast cancer</article-title>
          <source>Ann Oncol</source>
          <year>2016</year>
          <month>01</month>
          <volume>27</volume>
          <issue>1</issue>
          <fpage>10</fpage>
          <lpage>5</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0923-7534(19)35359-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/annonc/mdv507</pub-id>
          <pub-id pub-id-type="medline">26489443</pub-id>
          <pub-id pub-id-type="pii">S0923-7534(19)35359-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC4701120</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kehl</surname>
              <given-names>KL</given-names>
            </name>
            <name name-style="western">
              <surname>Riely</surname>
              <given-names>GJ</given-names>
            </name>
            <name name-style="western">
              <surname>Lepisto</surname>
              <given-names>EM</given-names>
            </name>
            <name name-style="western">
              <surname>Lavery</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Warner</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>LeNoue-Newton</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Sweeney</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Rudolph</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Brown</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bedard</surname>
              <given-names>PL</given-names>
            </name>
            <name name-style="western">
              <surname>Schrag</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Panageas</surname>
              <given-names>KS</given-names>
            </name>
            <collab>American Association of Cancer Research (AACR) Project Genomics Evidence Neoplasia Information Exchange (GENIE) Consortium</collab>
          </person-group>
          <article-title>Correlation Between Surrogate End Points and Overall Survival in a Multi-institutional Clinicogenomic Cohort of Patients With Non-Small Cell Lung or Colorectal Cancer</article-title>
          <source>JAMA Netw Open</source>
          <year>2021</year>
          <month>07</month>
          <day>01</day>
          <volume>4</volume>
          <issue>7</issue>
          <fpage>e2117547</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34309669"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jamanetworkopen.2021.17547</pub-id>
          <pub-id pub-id-type="medline">34309669</pub-id>
          <pub-id pub-id-type="pii">2782339</pub-id>
          <pub-id pub-id-type="pmcid">PMC8314138</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Gossai</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Monroe</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Nussbaum</surname>
              <given-names>NC</given-names>
            </name>
            <name name-style="western">
              <surname>Parrinello</surname>
              <given-names>CM</given-names>
            </name>
          </person-group>
          <article-title>Validation analysis of a composite real-world mortality endpoint for patients with cancer in the United States</article-title>
          <source>Health Serv Res</source>
          <year>2021</year>
          <month>12</month>
          <volume>56</volume>
          <issue>6</issue>
          <fpage>1281</fpage>
          <lpage>1287</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33998685"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/1475-6773.13669</pub-id>
          <pub-id pub-id-type="medline">33998685</pub-id>
          <pub-id pub-id-type="pmcid">PMC8586476</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ngo</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Keegan</surname>
              <given-names>TH</given-names>
            </name>
            <name name-style="western">
              <surname>Jonas</surname>
              <given-names>BA</given-names>
            </name>
            <name name-style="western">
              <surname>Hogarth</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>KK</given-names>
            </name>
          </person-group>
          <article-title>Assessing the Quality of Electronic Data for 'Fit-for-Purpose' by Utilizing Data Profiling Techniques Prior to Conducting a Survival Analysis for Adults with Acute Lymphoblastic Leukemia</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2020</year>
          <volume>2020</volume>
          <fpage>915</fpage>
          <lpage>924</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33936467"/>
          </comment>
          <pub-id pub-id-type="medline">33936467</pub-id>
          <pub-id pub-id-type="pii">127_3410402</pub-id>
          <pub-id pub-id-type="pmcid">PMC8075459</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Katkade</surname>
              <given-names>VB</given-names>
            </name>
            <name name-style="western">
              <surname>Sanders</surname>
              <given-names>KN</given-names>
            </name>
            <name name-style="western">
              <surname>Zou</surname>
              <given-names>KH</given-names>
            </name>
          </person-group>
          <article-title>Real world data: an opportunity to supplement existing evidence for the use of long-established medicines in health care decision making</article-title>
          <source>J Multidiscip Healthc</source>
          <year>2018</year>
          <volume>11</volume>
          <fpage>295</fpage>
          <lpage>304</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/29997436"/>
          </comment>
          <pub-id pub-id-type="doi">10.2147/JMDH.S160029</pub-id>
          <pub-id pub-id-type="medline">29997436</pub-id>
          <pub-id pub-id-type="pii">jmdh-11-295</pub-id>
          <pub-id pub-id-type="pmcid">PMC6033114</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Cook</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Wen</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Boruvka</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Bias in progression-free survival analysis due to intermittent assessment of progression</article-title>
          <source>Stat Med</source>
          <year>2015</year>
          <month>10</month>
          <day>30</day>
          <volume>34</volume>
          <issue>24</issue>
          <fpage>3181</fpage>
          <lpage>93</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/26011411"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/sim.6529</pub-id>
          <pub-id pub-id-type="medline">26011411</pub-id>
          <pub-id pub-id-type="pmcid">PMC4744753</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>von Allmen</surname>
              <given-names>RS</given-names>
            </name>
            <name name-style="western">
              <surname>Weiss</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tevaearai</surname>
              <given-names>HT</given-names>
            </name>
            <name name-style="western">
              <surname>Kuemmerli</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Tinner</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Carrel</surname>
              <given-names>TP</given-names>
            </name>
            <name name-style="western">
              <surname>Schmidli</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dick</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Completeness of Follow-Up Determines Validity of Study Findings: Results of a Prospective Repeated Measures Cohort Study</article-title>
          <source>PLoS One</source>
          <year>2015</year>
          <volume>10</volume>
          <issue>10</issue>
          <fpage>e0140817</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://boris.unibe.ch/id/eprint/74901"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0140817</pub-id>
          <pub-id pub-id-type="medline">26469346</pub-id>
          <pub-id pub-id-type="pii">PONE-D-15-20252</pub-id>
          <pub-id pub-id-type="pmcid">PMC4607456</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Haslam</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gill</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Prasad</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>The frequency of assessment of progression in randomized oncology clinical trials</article-title>
          <source>Cancer Rep (Hoboken)</source>
          <year>2022</year>
          <month>07</month>
          <volume>5</volume>
          <issue>7</issue>
          <fpage>e1527</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34821077"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/cnr2.1527</pub-id>
          <pub-id pub-id-type="medline">34821077</pub-id>
          <pub-id pub-id-type="pmcid">PMC9327664</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Holmgren</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Downing</surname>
              <given-names>NL</given-names>
            </name>
            <name name-style="western">
              <surname>Bates</surname>
              <given-names>DW</given-names>
            </name>
            <name name-style="western">
              <surname>Shanafelt</surname>
              <given-names>TD</given-names>
            </name>
            <name name-style="western">
              <surname>Milstein</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sharp</surname>
              <given-names>CD</given-names>
            </name>
            <name name-style="western">
              <surname>Cutler</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Huckman</surname>
              <given-names>RS</given-names>
            </name>
            <name name-style="western">
              <surname>Schulman</surname>
              <given-names>KA</given-names>
            </name>
          </person-group>
          <article-title>Assessment of Electronic Health Record Use Between US and Non-US Health Systems</article-title>
          <source>JAMA Intern Med</source>
          <year>2021</year>
          <month>02</month>
          <day>01</day>
          <volume>181</volume>
          <issue>2</issue>
          <fpage>251</fpage>
          <lpage>259</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33315048"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jamainternmed.2020.7071</pub-id>
          <pub-id pub-id-type="medline">33315048</pub-id>
          <pub-id pub-id-type="pii">2774129</pub-id>
          <pub-id pub-id-type="pmcid">PMC7737152</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>KJ</given-names>
            </name>
            <name name-style="western">
              <surname>Glynn</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Singer</surname>
              <given-names>DE</given-names>
            </name>
            <name name-style="western">
              <surname>Murphy</surname>
              <given-names>SN</given-names>
            </name>
            <name name-style="western">
              <surname>Lii</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Schneeweiss</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Out-of-system Care and Recording of Patient Characteristics Critical for Comparative Effectiveness Research</article-title>
          <source>Epidemiology</source>
          <year>2018</year>
          <month>05</month>
          <volume>29</volume>
          <issue>3</issue>
          <fpage>356</fpage>
          <lpage>363</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/29283893"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/EDE.0000000000000794</pub-id>
          <pub-id pub-id-type="medline">29283893</pub-id>
          <pub-id pub-id-type="pmcid">PMC5882528</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hatch</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Tillotson</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Angier</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Marino</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hoopes</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Huguet</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>DeVoe</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Using the electronic health record for assessment of health insurance in community health centers</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2016</year>
          <month>09</month>
          <volume>23</volume>
          <issue>5</issue>
          <fpage>984</fpage>
          <lpage>90</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/26911812"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocv179</pub-id>
          <pub-id pub-id-type="medline">26911812</pub-id>
          <pub-id pub-id-type="pii">ocv179</pub-id>
          <pub-id pub-id-type="pmcid">PMC6375120</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Burcu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Manzano-Salgado</surname>
              <given-names>CB</given-names>
            </name>
            <name name-style="western">
              <surname>Butler</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Christian</surname>
              <given-names>JB</given-names>
            </name>
          </person-group>
          <article-title>A Framework for Extension Studies Using Real-World Data to Examine Long-Term Safety and Effectiveness</article-title>
          <source>Ther Innov Regul Sci</source>
          <year>2022</year>
          <month>01</month>
          <volume>56</volume>
          <issue>1</issue>
          <fpage>15</fpage>
          <lpage>22</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34251656"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s43441-021-00322-8</pub-id>
          <pub-id pub-id-type="medline">34251656</pub-id>
          <pub-id pub-id-type="pii">10.1007/s43441-021-00322-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC8274256</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Suissa</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Immortal time bias in pharmaco-epidemiology</article-title>
          <source>Am J Epidemiol</source>
          <year>2008</year>
          <month>02</month>
          <day>15</day>
          <volume>167</volume>
          <issue>4</issue>
          <fpage>492</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1093/aje/kwm324</pub-id>
          <pub-id pub-id-type="medline">18056625</pub-id>
          <pub-id pub-id-type="pii">kwm324</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tyrer</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Bhaskaran</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Rutherford</surname>
              <given-names>MJ</given-names>
            </name>
          </person-group>
          <article-title>Immortal time bias for life-long conditions in retrospective observational studies using electronic health records</article-title>
          <source>BMC Med Res Methodol</source>
          <year>2022</year>
          <month>03</month>
          <day>27</day>
          <volume>22</volume>
          <issue>1</issue>
          <fpage>86</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedresmethodol.biomedcentral.com/articles/10.1186/s12874-022-01581-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12874-022-01581-1</pub-id>
          <pub-id pub-id-type="medline">35350993</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12874-022-01581-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC8962148</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hernán</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Robins</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>Using Big Data to Emulate a Target Trial When a Randomized Trial Is Not Available</article-title>
          <source>Am J Epidemiol</source>
          <year>2016</year>
          <month>04</month>
          <day>15</day>
          <volume>183</volume>
          <issue>8</issue>
          <fpage>758</fpage>
          <lpage>64</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/26994063"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/aje/kwv254</pub-id>
          <pub-id pub-id-type="medline">26994063</pub-id>
          <pub-id pub-id-type="pii">kwv254</pub-id>
          <pub-id pub-id-type="pmcid">PMC4832051</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Backenroth</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>How to choose a time zero for patients in external control arms</article-title>
          <source>Pharm Stat</source>
          <year>2021</year>
          <month>07</month>
          <volume>20</volume>
          <issue>4</issue>
          <fpage>783</fpage>
          <lpage>792</lpage>
          <pub-id pub-id-type="doi">10.1002/pst.2107</pub-id>
          <pub-id pub-id-type="medline">33655598</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jackson</surname>
              <given-names>JW</given-names>
            </name>
          </person-group>
          <article-title>Diagnostics for Confounding of Time-varying and Other Joint Exposures</article-title>
          <source>Epidemiology</source>
          <year>2016</year>
          <month>11</month>
          <volume>27</volume>
          <issue>6</issue>
          <fpage>859</fpage>
          <lpage>69</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/27479649"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/EDE.0000000000000547</pub-id>
          <pub-id pub-id-type="medline">27479649</pub-id>
          <pub-id pub-id-type="pmcid">PMC5308856</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Thorlund</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Dron</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>JJH</given-names>
            </name>
            <name name-style="western">
              <surname>Mills</surname>
              <given-names>EJ</given-names>
            </name>
          </person-group>
          <article-title>Synthetic and External Controls in Clinical Trials - A Primer for Researchers</article-title>
          <source>Clin Epidemiol</source>
          <year>2020</year>
          <volume>12</volume>
          <fpage>457</fpage>
          <lpage>467</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32440224"/>
          </comment>
          <pub-id pub-id-type="doi">10.2147/CLEP.S242097</pub-id>
          <pub-id pub-id-type="medline">32440224</pub-id>
          <pub-id pub-id-type="pii">242097</pub-id>
          <pub-id pub-id-type="pmcid">PMC7218288</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lau</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Jamali</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Loebenberg</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Health Canada Usage of Real World Evidence (RWE) in Regulatory Decision Making compared with FDA/EMA usage based on publicly available information</article-title>
          <source>J Pharm Pharm Sci</source>
          <year>2022</year>
          <volume>25</volume>
          <fpage>227</fpage>
          <lpage>236</lpage>
          <pub-id pub-id-type="doi">10.18433/jpps32715</pub-id>
          <pub-id pub-id-type="medline">35760071</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="web">
          <article-title>FDA Acceptance of Foreign Clinical Studies Not Conducted Under an IND: Frequently Asked Questions: Guidance for Industry and FDA Staff</article-title>
          <source>Food and Drug Administration</source>
          <access-date>2023-02-27</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.fda.gov/regulatory-information/search-fda-guidance-documents/fda-acceptance-foreign-clinical-studies-not-conducted-under-ind-frequently-asked-questions">https://www.fda.gov/regulatory-information/search-fda-guidance-documents/fda-acceptance-foreign-clinical-studies-not-conducted-under-ind-frequently-asked-questions</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>McNair</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Lumpkin</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kern</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hartman</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Use of RWE to Inform Regulatory, Public Health Policy, and Intervention Priorities for the Developing World</article-title>
          <source>Clin Pharmacol Ther</source>
          <year>2022</year>
          <month>01</month>
          <volume>111</volume>
          <issue>1</issue>
          <fpage>44</fpage>
          <lpage>51</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34655224"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/cpt.2449</pub-id>
          <pub-id pub-id-type="medline">34655224</pub-id>
          <pub-id pub-id-type="pmcid">PMC9298255</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Barrett</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Heaton</surname>
              <given-names>PM</given-names>
            </name>
          </person-group>
          <article-title>Real-World Data: An Unrealized Opportunity in Global Health?</article-title>
          <source>Clin Pharmacol Ther</source>
          <year>2019</year>
          <month>07</month>
          <volume>106</volume>
          <issue>1</issue>
          <fpage>57</fpage>
          <lpage>59</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31188467"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/cpt.1476</pub-id>
          <pub-id pub-id-type="medline">31188467</pub-id>
          <pub-id pub-id-type="pmcid">PMC6771465</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ramagopalan</surname>
              <given-names>SV</given-names>
            </name>
            <name name-style="western">
              <surname>Popat</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Gupta</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Boyne</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Lockhart</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hsu</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>O'Sullivan</surname>
              <given-names>DE</given-names>
            </name>
            <name name-style="western">
              <surname>Inskip</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ray</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Cheung</surname>
              <given-names>WY</given-names>
            </name>
            <name name-style="western">
              <surname>Griesinger</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Subbiah</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Transportability of Overall Survival Estimates From US to Canadian Patients With Advanced Non-Small Cell Lung Cancer With Implications for Regulatory and Health Technology Assessment</article-title>
          <source>JAMA Netw Open</source>
          <year>2022</year>
          <month>11</month>
          <day>01</day>
          <volume>5</volume>
          <issue>11</issue>
          <fpage>e2239874</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/36326765"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jamanetworkopen.2022.39874</pub-id>
          <pub-id pub-id-type="medline">36326765</pub-id>
          <pub-id pub-id-type="pii">2798150</pub-id>
          <pub-id pub-id-type="pmcid">PMC9634498</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref61">
        <label>61</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Degtiar</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Rose</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>A Review of Generalizability and Transportability</article-title>
          <source>Annu. Rev. Stat. Appl</source>
          <year>2022</year>
          <month>10</month>
          <day>19</day>
          <volume>10</volume>
          <issue>1</issue>
          <fpage>103837</fpage>
          <pub-id pub-id-type="doi">10.1146/annurev-statistics-042522-103837</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref62">
        <label>62</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Brixner</surname>
              <given-names>DI</given-names>
            </name>
            <name name-style="western">
              <surname>Holtorf</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Neumann</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Malone</surname>
              <given-names>DC</given-names>
            </name>
            <name name-style="western">
              <surname>Watkins</surname>
              <given-names>JB</given-names>
            </name>
          </person-group>
          <article-title>Standardizing quality assessment of observational studies for decision making in health care</article-title>
          <source>J Manag Care Pharm</source>
          <year>2009</year>
          <month>04</month>
          <volume>15</volume>
          <issue>3</issue>
          <fpage>275</fpage>
          <lpage>83</lpage>
          <pub-id pub-id-type="doi">10.18553/jmcp.2009.15.3.275</pub-id>
          <pub-id pub-id-type="medline">19326959</pub-id>
          <pub-id pub-id-type="pii">2009(15)3: 275-283</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref63">
        <label>63</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <collab>PLOS Medicine Editors</collab>
          </person-group>
          <article-title>Observational studies: getting clear about transparency</article-title>
          <source>PLoS Med</source>
          <year>2014</year>
          <month>08</month>
          <volume>11</volume>
          <issue>8</issue>
          <fpage>e1001711</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pmed.1001711"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pmed.1001711</pub-id>
          <pub-id pub-id-type="medline">25158064</pub-id>
          <pub-id pub-id-type="pii">PMEDICINE-D-14-02305</pub-id>
          <pub-id pub-id-type="pmcid">PMC4144975</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref64">
        <label>64</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Segal</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Kallich</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Oppenheim</surname>
              <given-names>ER</given-names>
            </name>
            <name name-style="western">
              <surname>Garrison</surname>
              <given-names>LP</given-names>
            </name>
            <name name-style="western">
              <surname>Iqbal</surname>
              <given-names>SU</given-names>
            </name>
            <name name-style="western">
              <surname>Kessler</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Alexander</surname>
              <given-names>GC</given-names>
            </name>
          </person-group>
          <article-title>Using Certification to Promote Uptake of Real-World Evidence by Payers</article-title>
          <source>J Manag Care Spec Pharm</source>
          <year>2016</year>
          <month>03</month>
          <volume>22</volume>
          <issue>3</issue>
          <fpage>191</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.18553/jmcp.2016.22.3.191</pub-id>
          <pub-id pub-id-type="medline">27003547</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref65">
        <label>65</label>
        <nlm-citation citation-type="web">
          <article-title>Best Practices for Conducting and Reporting Pharmacoepidemiologic Safety Studies Using Electronic Healthcare Data Sets</article-title>
          <source>Food and Drug Administration</source>
          <access-date>2023-02-27</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.fda.gov/regulatory-information/search-fda-guidance-documents/best-practices-conducting-and-reporting-pharmacoepidemiologic-safety-studies-using-electronic">https://www.fda.gov/regulatory-information/search-fda-guidance-documents/best-practices-conducting-and-reporting-pharmacoepidemiologic-safety-studies-using-electronic</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref66">
        <label>66</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Berger</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Sox</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Willke</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Brixner</surname>
              <given-names>DL</given-names>
            </name>
            <name name-style="western">
              <surname>Eichler</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Goettsch</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Madigan</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Makady</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Schneeweiss</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tarricone</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>SV</given-names>
            </name>
            <name name-style="western">
              <surname>Watkins</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Daniel Mullins</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Good practices for real-world data studies of treatment and/or comparative effectiveness: Recommendations from the joint ISPOR-ISPE Special Task Force on real-world evidence in health care decision making</article-title>
          <source>Pharmacoepidemiol Drug Saf</source>
          <year>2017</year>
          <month>09</month>
          <day>15</day>
          <volume>26</volume>
          <issue>9</issue>
          <fpage>1033</fpage>
          <lpage>1039</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/28913966"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/pds.4297</pub-id>
          <pub-id pub-id-type="medline">28913966</pub-id>
          <pub-id pub-id-type="pmcid">PMC5639372</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref67">
        <label>67</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Maarseveen</surname>
              <given-names>TD</given-names>
            </name>
            <name name-style="western">
              <surname>Maurits</surname>
              <given-names>MP</given-names>
            </name>
            <name name-style="western">
              <surname>Niemantsverdriet</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>van der Helm-van Mil</surname>
              <given-names>AHM</given-names>
            </name>
            <name name-style="western">
              <surname>Huizinga</surname>
              <given-names>TWJ</given-names>
            </name>
            <name name-style="western">
              <surname>Knevel</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Handwork vs machine: a comparison of rheumatoid arthritis patient populations as identified from EHR free-text by diagnosis extraction through machine-learning or traditional criteria-based chart review</article-title>
          <source>Arthritis Res Ther</source>
          <year>2021</year>
          <month>06</month>
          <day>22</day>
          <volume>23</volume>
          <issue>1</issue>
          <fpage>174</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arthritis-research.biomedcentral.com/articles/10.1186/s13075-021-02553-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s13075-021-02553-4</pub-id>
          <pub-id pub-id-type="medline">34158089</pub-id>
          <pub-id pub-id-type="pii">10.1186/s13075-021-02553-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC8218515</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref68">
        <label>68</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ayala Solares</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Diletta Raimondi</surname>
              <given-names>FE</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Rahimian</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Canoy</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Tran</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Pinho Gomes</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Payberah</surname>
              <given-names>AH</given-names>
            </name>
            <name name-style="western">
              <surname>Zottoli</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Nazarzadeh</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Conrad</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Rahimi</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Salimi-Khorshidi</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Deep learning for electronic health records: A comparative review of multiple deep neural architectures</article-title>
          <source>J Biomed Inform</source>
          <year>2020</year>
          <month>01</month>
          <volume>101</volume>
          <fpage>103337</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(19)30256-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2019.103337</pub-id>
          <pub-id pub-id-type="medline">31916973</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(19)30256-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref69">
        <label>69</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Brazeal</surname>
              <given-names>JG</given-names>
            </name>
            <name name-style="western">
              <surname>Alekseyenko</surname>
              <given-names>AV</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Fugal</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kirchoff</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Marsh</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lewin</surname>
              <given-names>DN</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Obeid</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wallace</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Assessing quality and agreement of structured data in automatic versus manual abstraction of the electronic health record for a clinical epidemiology study</article-title>
          <source>Research Methods in Medicine &#38; Health Sciences</source>
          <year>2021</year>
          <month>11</month>
          <day>22</day>
          <volume>2</volume>
          <issue>4</issue>
          <fpage>168</fpage>
          <lpage>178</lpage>
          <pub-id pub-id-type="doi">10.1177/26320843211061287</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref70">
        <label>70</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dagenais</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Russo</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Madsen</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Webster</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Becnel</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Use of Real-World Evidence to Drive Drug Development Strategy and Inform Clinical Trial Design</article-title>
          <source>Clin Pharmacol Ther</source>
          <year>2022</year>
          <month>01</month>
          <volume>111</volume>
          <issue>1</issue>
          <fpage>77</fpage>
          <lpage>89</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34839524"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/cpt.2480</pub-id>
          <pub-id pub-id-type="medline">34839524</pub-id>
          <pub-id pub-id-type="pmcid">PMC9299990</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref71">
        <label>71</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Dehmer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Yli-Harja</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Emmert-Streib</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Combining deep learning with token selection for patient phenotyping from electronic health records</article-title>
          <source>Sci Rep</source>
          <year>2020</year>
          <month>01</month>
          <day>29</day>
          <volume>10</volume>
          <issue>1</issue>
          <fpage>1432</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-020-58178-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-020-58178-1</pub-id>
          <pub-id pub-id-type="medline">31996705</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-020-58178-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC6989657</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref72">
        <label>72</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Harvey</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Rassen</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Kabelac</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Turenne</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Leonard</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Klesh</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Meyer</surname>
              <given-names>WA</given-names>
            </name>
            <name name-style="western">
              <surname>Kaufman</surname>
              <given-names>HW</given-names>
            </name>
            <name name-style="western">
              <surname>Anderson</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Petkov</surname>
              <given-names>VI</given-names>
            </name>
            <name name-style="western">
              <surname>Cronin</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Van Dyke</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Lowy</surname>
              <given-names>DR</given-names>
            </name>
            <name name-style="western">
              <surname>Sharpless</surname>
              <given-names>NE</given-names>
            </name>
            <name name-style="western">
              <surname>Penberthy</surname>
              <given-names>LT</given-names>
            </name>
          </person-group>
          <article-title>Association of SARS-CoV-2 Seropositive Antibody Test With Risk of Future Infection</article-title>
          <source>JAMA Intern Med</source>
          <year>2021</year>
          <month>05</month>
          <day>01</day>
          <volume>181</volume>
          <issue>5</issue>
          <fpage>672</fpage>
          <lpage>679</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33625463"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jamainternmed.2021.0366</pub-id>
          <pub-id pub-id-type="medline">33625463</pub-id>
          <pub-id pub-id-type="pii">2776810</pub-id>
          <pub-id pub-id-type="pmcid">PMC7905701</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref73">
        <label>73</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dron</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Kalatharan</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Gupta</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Haggstrom</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zariffa</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Morris</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>Arora</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Data capture and sharing in the COVID-19 pandemic: a cause for concern</article-title>
          <source>Lancet Digit Health</source>
          <year>2022</year>
          <month>10</month>
          <volume>4</volume>
          <issue>10</issue>
          <fpage>e748</fpage>
          <lpage>e756</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2589-7500(22)00147-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S2589-7500(22)00147-9</pub-id>
          <pub-id pub-id-type="medline">36150783</pub-id>
          <pub-id pub-id-type="pii">S2589-7500(22)00147-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC9489064</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref74">
        <label>74</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Alzu'bi</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Watzlaf</surname>
              <given-names>VJM</given-names>
            </name>
            <name name-style="western">
              <surname>Sheridan</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Electronic Health Record (EHR) Abstraction</article-title>
          <source>Perspect Health Inf Manag</source>
          <year>2021</year>
          <volume>18</volume>
          <issue>Spring</issue>
          <fpage>1g</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34035788"/>
          </comment>
          <pub-id pub-id-type="medline">34035788</pub-id>
          <pub-id pub-id-type="pii">phim0018-0001g</pub-id>
          <pub-id pub-id-type="pmcid">PMC8120673</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref75">
        <label>75</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Bellomo</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Magee</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Bennette</surname>
              <given-names>CS</given-names>
            </name>
            <name name-style="western">
              <surname>Tymejczyk</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Samant</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tucker</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Nussbaum</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Bowser</surname>
              <given-names>BE</given-names>
            </name>
            <name name-style="western">
              <surname>Kraut</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Bourla</surname>
              <given-names>AB</given-names>
            </name>
          </person-group>
          <article-title>Characterization of a Real-World Response Variable and Comparison with RECIST-Based Response Rates from Clinical Trials in Advanced NSCLC</article-title>
          <source>Adv Ther</source>
          <year>2021</year>
          <month>04</month>
          <volume>38</volume>
          <issue>4</issue>
          <fpage>1843</fpage>
          <lpage>1859</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33674928"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s12325-021-01659-0</pub-id>
          <pub-id pub-id-type="medline">33674928</pub-id>
          <pub-id pub-id-type="pii">10.1007/s12325-021-01659-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC8004504</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref76">
        <label>76</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Popat</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>SV</given-names>
            </name>
            <name name-style="western">
              <surname>Scheuer</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Hsu</surname>
              <given-names>GG</given-names>
            </name>
            <name name-style="western">
              <surname>Lockhart</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ramagopalan</surname>
              <given-names>SV</given-names>
            </name>
            <name name-style="western">
              <surname>Griesinger</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Subbiah</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Addressing challenges with real-world synthetic control arms to demonstrate the comparative effectiveness of Pralsetinib in non-small cell lung cancer</article-title>
          <source>Nat Commun</source>
          <year>2022</year>
          <month>06</month>
          <day>17</day>
          <volume>13</volume>
          <issue>1</issue>
          <fpage>3500</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41467-022-30908-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41467-022-30908-1</pub-id>
          <pub-id pub-id-type="medline">35715405</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41467-022-30908-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC9205915</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref77">
        <label>77</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bennett</surname>
              <given-names>KJ</given-names>
            </name>
            <name name-style="western">
              <surname>Mann</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ouyang</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Utilizing Combined Claims and Clinical Datasets for Research Among Potential Cases of Rare Diseases</article-title>
          <source>Int J Healthc Inf Syst Inform</source>
          <year>2018</year>
          <volume>13</volume>
          <issue>2</issue>
          <fpage>1</fpage>
          <lpage>12</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32913425"/>
          </comment>
          <pub-id pub-id-type="doi">10.4018/ijhisi.2018040101</pub-id>
          <pub-id pub-id-type="medline">32913425</pub-id>
          <pub-id pub-id-type="pmcid">PMC7479970</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref78">
        <label>78</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wells</surname>
              <given-names>BJ</given-names>
            </name>
            <name name-style="western">
              <surname>Chagin</surname>
              <given-names>KM</given-names>
            </name>
            <name name-style="western">
              <surname>Nowacki</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Kattan</surname>
              <given-names>MW</given-names>
            </name>
          </person-group>
          <article-title>Strategies for handling missing data in electronic health record derived data</article-title>
          <source>EGEMS (Wash DC)</source>
          <year>2013</year>
          <volume>1</volume>
          <issue>3</issue>
          <fpage>1035</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/25848578"/>
          </comment>
          <pub-id pub-id-type="doi">10.13063/2327-9214.1035</pub-id>
          <pub-id pub-id-type="medline">25848578</pub-id>
          <pub-id pub-id-type="pii">egems1035</pub-id>
          <pub-id pub-id-type="pmcid">PMC4371484</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref79">
        <label>79</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Just</surname>
              <given-names>BH</given-names>
            </name>
            <name name-style="western">
              <surname>Marc</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Munns</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sandefer</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Why Patient Matching Is a Challenge: Research on Master Patient Index (MPI) Data Discrepancies in Key Identifying Fields</article-title>
          <source>Perspect Health Inf Manag</source>
          <year>2016</year>
          <volume>13</volume>
          <issue>Spring</issue>
          <fpage>1e</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/27134610"/>
          </comment>
          <pub-id pub-id-type="medline">27134610</pub-id>
          <pub-id pub-id-type="pmcid">PMC4832129</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref80">
        <label>80</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>EK</given-names>
            </name>
            <name name-style="western">
              <surname>Nelson</surname>
              <given-names>CP</given-names>
            </name>
          </person-group>
          <article-title>Values and pitfalls of the use of administrative databases for outcomes assessment</article-title>
          <source>J Urol</source>
          <year>2013</year>
          <month>07</month>
          <volume>190</volume>
          <issue>1</issue>
          <fpage>17</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/23608038"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.juro.2013.04.048</pub-id>
          <pub-id pub-id-type="medline">23608038</pub-id>
          <pub-id pub-id-type="pii">S0022-5347(13)04098-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC4114235</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref81">
        <label>81</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Strom</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Faridi</surname>
              <given-names>KF</given-names>
            </name>
            <name name-style="western">
              <surname>Butala</surname>
              <given-names>NM</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tamez</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Valsdottir</surname>
              <given-names>LR</given-names>
            </name>
            <name name-style="western">
              <surname>Brennan</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Popma</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Kazi</surname>
              <given-names>DS</given-names>
            </name>
            <name name-style="western">
              <surname>Yeh</surname>
              <given-names>RW</given-names>
            </name>
          </person-group>
          <article-title>Use of Administrative Claims to Assess Outcomes and Treatment Effect in Randomized Clinical Trials for Transcatheter Aortic Valve Replacement</article-title>
          <source>Circulation</source>
          <year>2020</year>
          <month>07</month>
          <day>21</day>
          <volume>142</volume>
          <issue>3</issue>
          <fpage>203</fpage>
          <lpage>213</lpage>
          <pub-id pub-id-type="doi">10.1161/circulationaha.120.046159</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref82">
        <label>82</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Curtis</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Baddley</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Patkar</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Delzell</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Mikuls</surname>
              <given-names>TR</given-names>
            </name>
            <name name-style="western">
              <surname>Saag</surname>
              <given-names>KG</given-names>
            </name>
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Safford</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cannon</surname>
              <given-names>GW</given-names>
            </name>
          </person-group>
          <article-title>Derivation and preliminary validation of an administrative claims-based algorithm for the effectiveness of medications for rheumatoid arthritis</article-title>
          <source>Arthritis Res Ther</source>
          <year>2011</year>
          <volume>13</volume>
          <issue>5</issue>
          <fpage>R155</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arthritis-research.biomedcentral.com/articles/10.1186/ar3471"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/ar3471</pub-id>
          <pub-id pub-id-type="medline">21933396</pub-id>
          <pub-id pub-id-type="pii">ar3471</pub-id>
          <pub-id pub-id-type="pmcid">PMC3308085</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
