<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v22i3e16810</article-id>
      <article-id pub-id-type="pmid">32196460</article-id>
      <article-id pub-id-type="doi">10.2196/16810</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Blockchain-Authenticated Sharing of Genomic and Clinical Outcomes Data of Patients With Cancer: A Prospective Cohort Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Rusu</surname>
            <given-names>Lucia</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Yin</surname>
            <given-names>Kanhua</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Glicksberg</surname>
            <given-names>Benjamin Scott</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4515-8090</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Burns</surname>
            <given-names>Shohei</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7622-4658</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Currie</surname>
            <given-names>Rob</given-names>
          </name>
          <degrees>MBA</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1828-1827</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Griffin</surname>
            <given-names>Ann</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff6" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0837-6515</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>Zhen Jane</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff7" ref-type="aff">7</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2065-5296</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Haussler</surname>
            <given-names>David</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <xref rid="aff8" ref-type="aff">8</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1533-4575</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Goldstein</surname>
            <given-names>Theodore</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7424-5041</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Collisson</surname>
            <given-names>Eric</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <address>
            <institution>Division of Hematology and Oncology</institution>
            <institution>Department of Medicine</institution>
            <institution>University of California</institution>
            <addr-line>1450 3rd Street</addr-line>
            <addr-line>San Francisco, CA, 94158</addr-line>
            <country>United States</country>
            <phone>1 4153539888</phone>
            <email>collissonlab@gmail.com</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8037-9388</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Bakar Computational Health Sciences Institute</institution>
        <institution>University of California</institution>
        <addr-line>San Francisco, CA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Hasso Plattner Institute for Digital Health at Mount Sinai</institution>
        <institution>Icahn School of Medicine at Mount Sinai</institution>
        <addr-line>New York, NY</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Department of Genetics and Genomic Sciences</institution>
        <institution>Icahn School of Medicine at Mount Sinai</institution>
        <addr-line>New York, NY</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Division of Hematology and Oncology</institution>
        <institution>Department of Medicine</institution>
        <institution>University of California</institution>
        <addr-line>San Francisco, CA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>UC Santa Cruz Genomics Institute</institution>
        <institution>University of California, Santa Cruz</institution>
        <addr-line>Santa Cruz, CA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff6">
        <label>6</label>
        <institution>Helen Diller Family Comprehensive Cancer Center</institution>
        <institution>University of California</institution>
        <addr-line>San Francisco, CA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff7">
        <label>7</label>
        <institution>Department of Radiology and Biomedical Imaging</institution>
        <institution>University of California</institution>
        <addr-line>San Francisco, CA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff8">
        <label>8</label>
        <institution>Howard Hughes Medical Institute</institution>
        <addr-line>Santa Cruz, CA</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Eric Collisson <email>collissonlab@gmail.com</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>3</month>
        <year>2020</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>20</day>
        <month>3</month>
        <year>2020</year>
      </pub-date>
      <volume>22</volume>
      <issue>3</issue>
      <elocation-id>e16810</elocation-id>
      <history>
        <date date-type="received">
          <day>27</day>
          <month>10</month>
          <year>2019</year>
        </date>
        <date date-type="rev-request">
          <day>15</day>
          <month>11</month>
          <year>2019</year>
        </date>
        <date date-type="rev-recd">
          <day>9</day>
          <month>12</month>
          <year>2019</year>
        </date>
        <date date-type="accepted">
          <day>15</day>
          <month>12</month>
          <year>2019</year>
        </date>
      </history>
      <copyright-statement>©Benjamin Scott Glicksberg, Shohei Burns, Rob Currie, Ann Griffin, Zhen Jane Wang, David Haussler, Theodore Goldstein, Eric Collisson. Originally published in the Journal of Medical Internet Research (http://www.jmir.org), 20.03.2020.</copyright-statement>
      <copyright-year>2020</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on http://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="http://www.jmir.org/2020/3/e16810/" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Efficiently sharing health data produced during standard care could dramatically accelerate progress in cancer treatments, but various barriers make this difficult. Not sharing these data to ensure patient privacy is at the cost of little to no learning from real-world data produced during cancer care. Furthermore, recent research has demonstrated a willingness of patients with cancer to share their treatment experiences to fuel research, despite potential risks to privacy.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>The objective of this study was to design, pilot, and release a decentralized, scalable, efficient, economical, and secure strategy for the dissemination of deidentified clinical and genomic data with a focus on late-stage cancer.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We created and piloted a blockchain-authenticated system to enable secure sharing of deidentified patient data derived from standard of care imaging, genomic testing, and electronic health records (EHRs), called the Cancer Gene Trust (CGT). We prospectively consented and collected data for a pilot cohort (N=18), which we uploaded to the CGT. EHR data were extracted from both a hospital cancer registry and a common data model (CDM) format to identify optimal data extraction and dissemination practices. Specifically, we scored and compared the level of completeness between two EHR data extraction formats against the gold standard source documentation for patients with available data (n=17).</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Although the total completeness scores were greater for the registry reports than those for the CDM, this difference was not statistically significant. We did find that some specific data fields, such as histology site, were better captured using the registry reports, which can be used to improve the continually adapting CDM. In terms of the overall pilot study, we found that CGT enables rapid integration of real-world data of patients with cancer in a more clinically useful time frame. We also developed an open-source Web application to allow users to seamlessly search, browse, explore, and download CGT data.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Our pilot demonstrates the willingness of patients with cancer to participate in data sharing and how blockchain-enabled structures can maintain relationships between individual data elements while preserving patient privacy, empowering findings by third-party researchers and clinicians. We demonstrate the feasibility of CGT as a framework to share health data trapped in silos to further cancer research. Further studies to optimize data representation, stream, and integrity are required.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>data sharing</kwd>
        <kwd>electronic health records</kwd>
        <kwd>genomics</kwd>
        <kwd>medicine</kwd>
        <kwd>blockchain</kwd>
        <kwd>neoplasms</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Every patient with cancer has a unique disease composition and presentation that demands interrogation of complex imaging and genome characteristics [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>] for personalized treatment recommendations. Currently, it is still standard to report outcomes of cancer as group averages from clinical trials treated with prospectively dictated regimens. Individual patient outcomes from real-world data could further advance personalized medicine by allowing dramatically more treatments and outcomes to be considered [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref4">4</xref>]. As such a health system can learn from its own data to improve its delivery of patient care [<xref ref-type="bibr" rid="ref5">5</xref>-<xref ref-type="bibr" rid="ref7">7</xref>]. Regulatory requirements and other restrictions prevent much patient-level data from being shared. Research progress suffers as a result. Precision medicine methodologies such as next-generation tumor DNA sequencing are now often performed in routine cancer care. Unfortunately, results are siloed in individual institutions, frustrating effective sharing or pooling of datasets [<xref ref-type="bibr" rid="ref8">8</xref>]. Many patients with cancer, however, are willing to share their data and believe that the positive benefits outweigh the potential privacy risks: 93% of patients surveyed would be very or somewhat likely to share their data with university scientists [<xref ref-type="bibr" rid="ref9">9</xref>].</p>
      <p>Despite this need and patients’ willingness to share their data, robust deidentified data sharing methods are lacking. Innovative alternative strategies have been developed that aim to anonymize identifiable clinical data in a way that preserves inherent structure, such as using generative adversarial networks [<xref ref-type="bibr" rid="ref10">10</xref>], but these have not as of yet been deployed for large-scale, multiomic discovery. One immediate challenge of creating an extensible and robust framework is identifying which data are necessary to share (and in what format), minimizing risk for patient reidentification while maximizing viable information that can lead to clinical insight. Conley et al [<xref ref-type="bibr" rid="ref11">11</xref>] released a core set of clinical data elements that various stakeholders agreed on for cancer genomic repositories. The lack of a standard data sharing platform for clinical data arises from myriad causes, including but not limited to, incompatible data streams or formats, nonstandardized collection, conflicting business models, extraction and accessibility procedures, and privacy concerns. A centralized, curated platform operated by a single institution is not ideal due to concerns of data ownership, cost, and dissemination procedures. Trends in other fields have migrated from analyzing batched data quarterly, whether from customer Web clicks or manufacturing floor sensors, to real-time analyses. Learning cycles have been reduced from months to hours. Finally, centralized top-down data sharing efforts, although critical to research and scientific deductive understanding, have a fixed lifetime of the study, grant, or group interest.</p>
      <p>Software standards based on health care data sharing and electronic commerce are converging to enable solutions to the compelling need to share patient health data for both care management and medical research. In 2013, the Global Alliance for Genomic Health [<xref ref-type="bibr" rid="ref12">12</xref>] was established to enable a framework for secure, responsible, and effective clinical and genomic data sharing. In 2016, the US president unveiled the National Cancer Institute Cancer Moonshot effort to accelerate cancer research, including efforts focused on data sharing (the Public Access and Data Sharing Policy). Since then, significant progress has been made in mining and sharing medical data. The Food and Drug Administration announced a collaboration with Flatiron Health to utilize deidentified clinical data for the analysis and development of anticancer therapies outside of clinical trials in 2016. Recent studies have delivered on that promise: Agarwal et al [<xref ref-type="bibr" rid="ref7">7</xref>] analyzed more than 7000 clinical and genomic records from the Flatiron Health network and Foundation Medicine to calculate the tumor mutation burden across cancer subtypes. Singal et al [<xref ref-type="bibr" rid="ref13">13</xref>] demonstrated that data collected from routine clinical care of almost 30,000 patients with cancer can yield novel clinical insights, as evidenced in this case for non–small cell lung cancer.</p>
      <p>A decentralized, scalable, efficient, economical, and secure strategy, such as blockchain technology, can fulfill requirements for effective clinical data sharing. Although not perfect in their scope [<xref ref-type="bibr" rid="ref14">14</xref>], blockchain systems by design are secure and resistant to tampering and distributed with no single point of control or failure allowing transactions to be efficiently recorded and verified. Multiple publications have proposed the utility of blockchain technology for secure and scalable clinical data sharing [<xref ref-type="bibr" rid="ref15">15</xref>-<xref ref-type="bibr" rid="ref19">19</xref>], and many companies and organizations are applying blockchain platforms in health care [<xref ref-type="bibr" rid="ref20">20</xref>]. Although the excitement surrounding the utilization of blockchain for distributing health care data is encouraging [<xref ref-type="bibr" rid="ref21">21</xref>], many studies are private, theoretical (ie, accessing feasibility), or unsuccessful in scope. In a recent systematic review of 71 studies that discussed managing health care records via blockchain, only four actually were tested on live data [<xref ref-type="bibr" rid="ref22">22</xref>].</p>
      <p>Here, we develop a public demonstration of curated collection that focuses on capturing the data created over the normal course of clinical care as rapidly as possible. The Cancer Gene Trust (CGT) [<xref ref-type="bibr" rid="ref23">23</xref>] democratizes data analysis, enabling more experts to participate and compare results, and accelerates the translation of genomic findings toward a clinically useful timescale. CGT is the first free, simple, rapid, global network to share deidentified cancer somatic mutations, radiographic and pathological images, and associated clinical data for prospectively consented patients. These data are rapidly deposited into a global off-blockchain distributed and decentralized repository. This framework not only allows for the rapid dissemination of high yield and important data but also openly details the rigorous process for deidentification, study design, and informed patient consent. From the findings of Mello et al [<xref ref-type="bibr" rid="ref9">9</xref>], we hypothesized that most patients are willing to consent to their data being shared if it helps expand the corpus of medical knowledge. We aim to demonstrate the utility of CGT by releasing such data from a pilot study of 18 consented patients along with an open-source and freely available application for visualization and exploration.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Study Design and Recruitment</title>
        <p>The University of California, San Francisco (UCSF) institutional review board (IRB) approved our pilot study to consent patients for distributing their deidentified information on CGT (see <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> for study protocol). We approached and consented 18 patients under care at UCSF Medical Center to the <italic>Sharing Clinical and Genomic Data in Cancer Research</italic> clinical pilot protocol (IRB #16-20857).</p>
      </sec>
      <sec>
        <title>The Cancer Gene Trust Framework</title>
        <p>CGT is a decentralized, distributed content addressable real-time database. A submission consists of a manifest containing fields and references to files by hash. Submissions may include deidentified clinical fields, a list of somatic mutations, gene expression, or any type of data relevant to a patient. Submissions are tracked per steward (ie, institution or organization) via a smart contract on the Ethereum [<xref ref-type="bibr" rid="ref24">24</xref>] blockchain, which references the underlying data stored via hash in InterPlanetary File System (IPFS) [<xref ref-type="bibr" rid="ref25">25</xref>]. IPFS is inherently decentralized and distributed. Any node may request data from any other node via the unique hash of the data and cache it locally. This affords organic replication of data as well as scalable access. An institution performing internal access and analysis of data may run their own IPFS server and thereby allow high-speed LAN access with only the initial request traversing the list of IPFS servers to find data matching the hash.</p>
      </sec>
      <sec>
        <title>Data Collection Procedures</title>
        <p>We carefully navigated all institutional procedures to educate and consent our patients before obtaining, formatting, and distributing deidentified patient data from our cohort (<xref rid="figure1" ref-type="fig">Figure 1</xref>). We performed stringent and comprehensive privacy processes to be as confident as possible so that no identifying personal health information would be shared (see Data Deidentification section). For the 18 enrolled patients, we were given permission to obtain clinical documentation from their electronic health record (EHR), their somatic mutation information, as well as any scans taken [<xref ref-type="bibr" rid="ref26">26</xref>]. All data, including genomic, imaging, and structured EHR data (eg, treatment information), for the first cohort of consented patients are available [<xref ref-type="bibr" rid="ref23">23</xref>]. Patients are identified by a universally unique identifier (UUID-4). The only mapping to the actual patient is securely controlled by trusted stewards; in this case, UCSF. All source code and documentation for CGT are available [<xref ref-type="bibr" rid="ref27">27</xref>].</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Workflow and pipeline for Cancer Gene Trust. EHR: electronic health record; HIPAA: Health Insurance Portability and Accountability Act.</p>
          </caption>
          <graphic xlink:href="jmir_v22i3e16810_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <sec>
          <title>Overall Workflow for Cancer Gene Trust Pipeline</title>
          <p>Patients are consented to agree to release their deidentified clinical (Observational Medical Outcomes Partnership [OMOP]-formatted EHR data), genomics (somatic), and imaging data on the blockchain. Stewards representing the affiliated institution then upload the data to CGT. Researchers, clinicians, patients, and the public can then retrieve the data through the Web or interface, with the data dynamically available through the PatientExploreR-CGT app.</p>
        </sec>
        <sec>
          <title>Genomic Data Collection</title>
          <p>Somatic gene sequencing of tumor specimens was ordered by the supervising physician (EC) as standard of care using either a commercial (Foundation Medicine; FMI [<xref ref-type="bibr" rid="ref28">28</xref>]) or in-house panel (UCSF 500) [<xref ref-type="bibr" rid="ref29">29</xref>]; 13 patients were sequenced and analyzed by Foundation Medicine [<xref ref-type="bibr" rid="ref30">30</xref>] and 4 patients by the UCSF 500 [<xref ref-type="bibr" rid="ref31">31</xref>] genomic panel. In the case of Foundation Medicine, we received the patient’s report in XML format. In the case of the UCSF 500, we requested a deidentified variant call file from the UCSF genomic stewards.</p>
        </sec>
        <sec>
          <title>Image Data Collection</title>
          <p>For patients with available radiograph imaging, we obtained deidentified DICOM files from the UCSF’s Picture Archiving and Communication System medical imaging system conforming to Supplement 142: Clinical Trial De-identification Basic Profile, which removes any identifying protected health information (PHI) from the images as well as any accompanying metadata. Pathology slides were obtained for each patient who had associated pathology performed at UCSF. Deidentified computed tomography (CT) and positron-emission tomography-CT scans correlating to significant changes in tumor response were uploaded for 3 patients to the CGT. Scanned pathology slides clinically utilized for diagnostic purposes were uploaded for 2 of these patients. These deidentified imaging data can be viewed publicly in their entirety on the CGT and illustrate an example collection of raw (but deidentified), clinically relevant data for public research use. Phillips scanners were used to digitize the pathology slides, and a review of PHI was completed before uploading onto CGT.</p>
        </sec>
        <sec>
          <title>Clinical Electronic Health Record Data Collection</title>
          <p>A large aspect of this project was to evaluate the most suitable and robust source of clinical data to share on CGT. For this comparison, we compared UCSF Cancer registry data, collected to meet the specifications of the Surveillance, Epidemiology, and End Results (SEER) Program, with Observational Health Data Sciences and Informatics (OHDSI) OMOP common data model (CDM) extracted from the hospital EHR. The OMOP CDM is emerging as a standard in the field of EHR research because it is a common framework in terms of both table structure and underlying vocabulary [<xref ref-type="bibr" rid="ref32">32</xref>] and has enabled powerful research and a venue for regulatory reporting [<xref ref-type="bibr" rid="ref33">33</xref>].</p>
          <p>SEER is a national registry for cancer reporting and provides specific guidelines for data collection from the EHR [<xref ref-type="bibr" rid="ref34">34</xref>]. Before SEER submission, cancer registry data are submitted to the state registry and assessed for data quality and consolidation with other records for the same patient. Registry data are collected on every cancer case admitted to a UCSF hospital for either diagnosis and/or first course or subsequent cancer treatment per California state cancer reporting law. Certified Tumor Registrars abstract and code cancer information from the EHR in a format specified by the North American Association of Central Cancer Registries’ Data Standards [<xref ref-type="bibr" rid="ref35">35</xref>]. The data collection and coding rules for data collection are specified by the SEER Program Manual and fully abstracted within 6 months of patients’ date of first contact with the hospital.</p>
        </sec>
        <sec>
          <title>Registry Format</title>
          <p>For the first 18 patients, clinical data were requested from the cancer registrar’s office for curated data for ultimate submission to SEER via the CNExT cancer registry software. For each patient, we received an Excel export from CNExT with curated clinical data fields (<xref ref-type="table" rid="table1">Table 1</xref>). We developed a client-side single-page Web application that read in this Excel file on the research coordinators computer, filtered PHI to ensure compliance with IRB regulatory guidelines, and generated a deidentified JSON file. The primary investigator and research coordinator personally reviewed each deidentified registry file for PHI before uploading onto CGT. Depending on the timing of the patient’s presentation to the hospital relative to genetic testing, the registry data collection could be in either an incomplete <italic>suspense</italic> state or a completed abstract. Minimum data collection in a suspense case comprises patient age, gender, date of first contact, primary site, and histology. Complete cases contained additional data items related to Basis of Diagnosis and Therapeutic Agent.</p>
          <table-wrap position="float" id="table1">
            <label>Table 1</label>
            <caption>
              <p>Breakdown of data elements for registry/Observational Medical Outcomes Partnership.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="280"/>
              <col width="270"/>
              <col width="450"/>
              <thead>
                <tr valign="top">
                  <td>Gold Standard EHR<sup>a</sup></td>
                  <td>Registry field</td>
                  <td>OMOP table.column</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>Gender</td>
                  <td>Sex</td>
                  <td>person.gender_concept_id</td>
                </tr>
                <tr valign="top">
                  <td>Ethnicity</td>
                  <td>Spanish Origin</td>
                  <td>person.ethnicity_concept_id </td>
                </tr>
                <tr valign="top">
                  <td>Race</td>
                  <td>Race</td>
                  <td>person.race_concept_id</td>
                </tr>
                <tr valign="top">
                  <td>Date of Diagnosis</td>
                  <td>Date of Diagnosis<sup>b</sup></td>
                  <td>condition_occurrence. condition_start_date</td>
                </tr>
                <tr valign="top">
                  <td>Basis of Diagnosis </td>
                  <td>Dx Confimation DX Staging/Proc Summ<sup>b</sup></td>
                  <td>procedure_occurrence. procedure_occurrence_id</td>
                </tr>
                <tr valign="top">
                  <td>Cancer Site</td>
                  <td>Cancer Site ICD-0-3 SEER<sup>c</sup> Site Group</td>
                  <td>condition_occurrence. condition_concept_id</td>
                </tr>
                <tr valign="top">
                  <td>Cancer Histology/Morphology</td>
                  <td>Cancer Histology (ICD-0-3)</td>
                  <td>condition_occurrence. condition_concept_id</td>
                </tr>
                <tr valign="top">
                  <td>Therapeutic Agent/Modality</td>
                  <td>Text/Code of Chemo At Hospital<sup>b</sup></td>
                  <td>drug_exposure. drug_concept_id</td>
                </tr>
                <tr valign="top">
                  <td>Beginning and End Dates of Treatment</td>
                  <td>Chemo Start Date/Chemo End Date<sup>b</sup></td>
                  <td>drug_exposure. drug_exposure_start_date/drug_exposure. drug_exposure_end_date</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table1fn1">
                <p><sup>a</sup>EHR: electronic health record.</p>
              </fn>
              <fn id="table1fn2">
                <p><sup>b</sup>Indicates that the field is listed but no or incomplete information was populated (ie, “suspense” registry cases).</p>
              </fn>
              <fn id="table1fn3">
                <p><sup>c</sup>SEER: Surveillance, Epidemiology, and End Results.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
        </sec>
        <sec>
          <title>Observational Medical Outcomes Partnership Format</title>
          <p>Procuring clinical data from OMOP was a different process as it involved extraction of retrospective, routinely collected data from the EHR. The Enterprise Data Warehouse (EDW) team at UCSF is responsible for converting raw EPIC/Clarity data into the OMOP format and acted as an honest broker for this extraction process. First, we selected the tables and fields that corresponded to data elements we were consented to collect from our IRB, with buy-in from the EDW team (<xref ref-type="table" rid="table1">Table 1</xref>). No free-text fields were included. We then provided the medical record numbers (MRNs), and their corresponding CGT patient IDs, to the EDW team who then performed the deidentification process for 17 patients with available data, removing all PHI (see <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> and below for more details). The EDW then extracted the data in the agreed-upon columns in 6 tables of interest, specifically: person, drug_exposure, condition_occurrence, procedure_occurrence, and measurement. We then performed a secondary check to verify all data were deidentified (see below), and then transformed the files (saved as TSV) into a single JSON file per patient.</p>
        </sec>
      </sec>
      <sec>
        <title>Clinical Data Scoring Methodology</title>
        <p>We evaluated all patients’ registry and OMOP data for completeness based on a scoring rubric we designed (see <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> for full details) relating to certain gold-standard metrics essential for clinical data sharing (<xref ref-type="table" rid="table1">Table 1</xref>), inspired by Conley et al [<xref ref-type="bibr" rid="ref11">11</xref>]. Data from these gold-standard metrics were captured from the <italic>true</italic> data recorded in UCSF EPIC EHR system patient records. Next, reviewers evaluated how much of these data could be identified from registry and OMOP data sources. Of the 29 data elements recommended by Conley et al [<xref ref-type="bibr" rid="ref11">11</xref>], we were able to capture 10 of these due to their ability to be obtained without curation from OMOP and registry clinical pipelines. Simply, these data were evaluated on a scale from 0 to 5 for registry and OMOP data, with 0 representing no presence of the data element in the corresponding modality and 5 representing complete representation (values in between correspond to 20% increments of how complete the representation is). As such, for the 10 data elements, the maximum score a patient can receive per data modality is 50.</p>
      </sec>
      <sec>
        <title>Statistical Analysis</title>
        <p>To assess whether there was any significant difference between registry vs OMOP in terms of data quality capture, we performed a 2-sided Wilcoxon signed-rank test for all 17 patients who were scored according to the above methodology. We further assessed whether there was any difference at the field level, by performing the same assessment per data element (eg, Gender information). We hypothesized that although these two systems are different in terms of data collection methodologies, there should be no significant difference in total scores as both systems are organized to capture the same type of clinical data.</p>
      </sec>
      <sec>
        <title>Data Deidentification Procedures</title>
        <p>We strived to conform to the most rigorous standards for proper deidentification of all data released as determined by Health Insurance Portability and Accountability Act (HIPAA) standards (see <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> for further discussion and complete documentation of this process).</p>
        <p>For the OMOP EHR data, all PHI was removed on receiving the data from the honest broker, the EDW. In these files, all dates were converted into age in days since birth. We performed a secondary check to manually verify that no PHI remained in the files. For genomic data, all germ-line mutations were removed, leaving only somatic variants. No further processing was required for the DICOM images that conform to Supplement 142. Pathology scans were exported into JPEG image files with no identifying metadata or information in the image. The single-page Web application generates a UUID for every patient. The institution and CGT steward maintain an appendix of CGT IDs and UCSF MRNs to preserve the possibility of reidentification between qualified clinicians for follow-up and further research [<xref ref-type="bibr" rid="ref36">36</xref>].</p>
      </sec>
      <sec>
        <title>Data Export and Sharing</title>
        <p>These deidentified files are uploaded to the off-blockchain store (IPFS) [<xref ref-type="bibr" rid="ref25">25</xref>]. The off-blockchain store calculates a cryptographically strong hash (SHA-256) of the entire submission that is added to the stewards list of submissions, which is then updated in the off-blockchain store. This final step yields an updated top level cryptographically strong hash that uniquely defines the entire state of all submissions from the steward at that point in time. This final top-level hash is then submitted to the blockchain as provenance for the entire corpus of submissions from the institution. As the hash is only 256 bits in size, the cost to add to a blockchain is minimized with the bulk of the data stored uniquely in the off-blockchain store. Individual submission hashes as well as the overall steward hash may be concisely referenced toward reproducing any downstream analysis.</p>
      </sec>
      <sec>
        <title>Data Distribution and Access</title>
        <p>Submissions including all data are immediately available from any IPFS server on the internet via the submission hash. IPFS is inherently decentralized and distributed. Any node may request data from any other node via the unique hash of the data and cache it locally. An IPFS server when queried for the data associated with a hash returns it if it has it locally stored, and if not asks all of the servers it is connected to for the data. In spirit, this is similar to the Transmission Control Protocol/Internet Protocol layer of the internet whereby if a router does not talk directly to the destination it checks with all of its direct peers to see if they do. As a result, data are duplicated as a side effect of access affording organic replication and scalable access. IPFS servers speak HTTP and therefore any data can be accessed in a browser or with a few lines of code from standard bioinformatics analysis tools (eg, cBio, Galaxy, and Jupyter).</p>
      </sec>
      <sec>
        <title>PatientExploreR-Cancer Gene Trust: Data Visualization</title>
        <p>To facilitate interaction with CGT, we adapted a visualization application to browse, search, visualize, and download the clinical and genomic data shared on CGT. This application, called PatientExploreR-CGT, is adapted from our original PatientExploreR version [<xref ref-type="bibr" rid="ref37">37</xref>]. PatientExploreR-CGT automatically pulls and maps all data from CGT into a user-friendly dashboard. This application is built in R (version 3.4.1) using the Shiny [<xref ref-type="bibr" rid="ref38">38</xref>] (version 1.0.5) framework and directly interfaces with OMOP-formatted (version 5 or later) EHR data. In the front-end, the following Shiny-related packages are utilized: shinyWidgets [<xref ref-type="bibr" rid="ref39">39</xref>], shinyjs [<xref ref-type="bibr" rid="ref40">40</xref>], shinyalert [<xref ref-type="bibr" rid="ref41">41</xref>], shinycssloaders [<xref ref-type="bibr" rid="ref42">42</xref>], shinyBS [<xref ref-type="bibr" rid="ref43">43</xref>], and shinythemes [<xref ref-type="bibr" rid="ref44">44</xref>]. Visualizations were created using the plotly [<xref ref-type="bibr" rid="ref45">45</xref>] and timevis [<xref ref-type="bibr" rid="ref46">46</xref>] packages. In its backend, PatientExploreR-CGT makes use of ROMOP [<xref ref-type="bibr" rid="ref47">47</xref>] to automatically extract and map pertinent concepts across all relevant tables (eg, person, observation, and condition occurrence). Data processing and manipulation were facilitated by data.table [<xref ref-type="bibr" rid="ref48">48</xref>], DT [<xref ref-type="bibr" rid="ref49">49</xref>], rjson [<xref ref-type="bibr" rid="ref50">50</xref>], and dplyr [<xref ref-type="bibr" rid="ref51">51</xref>]. This app can be freely accessed [<xref ref-type="bibr" rid="ref52">52</xref>].</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Cancer Gene Trust Pilot Study</title>
        <p>We provide the demographics of the pilot cohort in <xref ref-type="table" rid="table2">Table 2</xref>. In our cohort, the breakdown of primary cancer was as follows: seven with pancreatic adenocarcinoma, four with cholangiocarcinoma, and one each with anal squamous carcinoma, gastric cancer, colon cancer, gastrointestinal stromal tumor, cecal cancer, and metastatic cancer of unknown primary origin. An additional patient also had metastatic cancer of unknown primary origin but without EHR data. We provide a breakdown of all such data by patient and modality in <xref ref-type="table" rid="table3">Table 3</xref>.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Cohort demographics and clinical information. Demographic breakdown of clinical pilot cohort.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="470"/>
            <col width="500"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Modality</td>
                <td>Value</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="3">
                  <bold>Gender, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Male</td>
                <td>6 (33)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Female</td>
                <td>12 (67)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Race, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>White</td>
                <td>11 (61)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Asian</td>
                <td>5 (28)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Unknown</td>
                <td>2 (11)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Ethnicity, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Hispanic/Latino</td>
                <td>2 (11)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Not Hispanic/Latino</td>
                <td>16 (89)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Status, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Alive</td>
                <td>15 (83)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Deceased</td>
                <td>3 (17)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Age (years), mean (SD)</td>
                <td>59.3 (13.3)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Breakdown of Cancer Gene Trust data by patient and modality.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="310"/>
            <col width="80"/>
            <col width="70"/>
            <col width="50"/>
            <col width="100"/>
            <col width="50"/>
            <col width="90"/>
            <col width="90"/>
            <col width="100"/>
            <col width="60"/>
            <thead>
              <tr valign="top">
                <td>CGT<sup>a</sup></td>
                <td colspan="2">Clinical</td>
                <td colspan="2">Genomics</td>
                <td colspan="2">Imaging</td>
                <td colspan="3">OMOP<sup>b</sup> data breakdown</td>
              </tr>
              <tr valign="top">
                <td>CGT Public UUID<sup>c</sup></td>
                <td>Registry</td>
                <td>OMOP</td>
                <td>FMI<sup>d</sup></td>
                <td>UCSF<sup>e</sup> 500</td>
                <td>CT<sup>f</sup></td>
                <td>Pathology</td>
                <td>Conditions</td>
                <td>Procedures</td>
                <td>Drugs</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>f9b6a782-bbf5-4be8-bf7e-d1a9586d9552</td>
                <td>✓</td>
                <td>✓</td>
                <td>✓</td>
                <td>N/A<sup>g</sup></td>
                <td>N/A</td>
                <td>N/A</td>
                <td>1597</td>
                <td>1190</td>
                <td>3661</td>
              </tr>
              <tr valign="top">
                <td>c2e2e081-4c39-4201-8a27-7b469ed39490</td>
                <td>✓</td>
                <td>✓</td>
                <td>✓</td>
                <td>N/A</td>
                <td>✓</td>
                <td>✓</td>
                <td>1350</td>
                <td>969</td>
                <td>2088</td>
              </tr>
              <tr valign="top">
                <td>db2d85aa-4f94-4e77-8755-6b94a710c1aa</td>
                <td>✓</td>
                <td>✓</td>
                <td>✓</td>
                <td>N/A</td>
                <td>✓</td>
                <td>✓</td>
                <td>2389</td>
                <td>1394</td>
                <td>3086</td>
              </tr>
              <tr valign="top">
                <td>2fbc25da-3965-49c4-866f-72cf0abc2417</td>
                <td>✓</td>
                <td>✓</td>
                <td>✓</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>930</td>
                <td>654</td>
                <td>1174</td>
              </tr>
              <tr valign="top">
                <td>940171e7-d358-463a-8d9a-2b2fa90c2a84</td>
                <td>✓</td>
                <td>✓</td>
                <td>✓</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>1179</td>
                <td>624</td>
                <td>1388</td>
              </tr>
              <tr valign="top">
                <td>f0314175-2d19-4146-8754-fc5aed3ab420</td>
                <td>✓</td>
                <td>✓</td>
                <td>✓</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>511</td>
                <td>405</td>
                <td>549</td>
              </tr>
              <tr valign="top">
                <td>c7dbcfac-37ea-43f8-8899-1a9f2fb56341</td>
                <td>✓</td>
                <td>✓</td>
                <td>✓</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>216</td>
                <td>114</td>
                <td>184</td>
              </tr>
              <tr valign="top">
                <td>ef5c3164-6f45-4d3a-88f0-4509226c5571</td>
                <td>✓</td>
                <td>✓</td>
                <td>N/A</td>
                <td>✓</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>51</td>
                <td>14</td>
                <td>57</td>
              </tr>
              <tr valign="top">
                <td>ec3d977b-c310-4df3-a444-f79bc3dd8b58</td>
                <td>✓</td>
                <td>✓</td>
                <td>N/A</td>
                <td>✓</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>811</td>
                <td>505</td>
                <td>776</td>
              </tr>
              <tr valign="top">
                <td>131cf62d-ad78-49c1-a699-5bcc1004cd12</td>
                <td>✓</td>
                <td>✓</td>
                <td>✓</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>155</td>
                <td>42</td>
                <td>110</td>
              </tr>
              <tr valign="top">
                <td>cf11c31c-f4c3-48ba-9c46-66f406d0b7a1</td>
                <td>✓</td>
                <td>✓</td>
                <td>✓</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>311</td>
                <td>162</td>
                <td>131</td>
              </tr>
              <tr valign="top">
                <td>ccc2ba97-912f-4b62-b767-cca129ee6a56</td>
                <td>✓</td>
                <td>✓</td>
                <td>N/A</td>
                <td>✓</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>51</td>
                <td>10</td>
                <td>60</td>
              </tr>
              <tr valign="top">
                <td>104ec531-5d95-41e2-ac72-f6cff2006b8e</td>
                <td>✓</td>
                <td>✓</td>
                <td>✓</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>36</td>
                <td>10</td>
                <td>17</td>
              </tr>
              <tr valign="top">
                <td>a5627ac3-450d-4036-ade8-99ae62a5c232</td>
                <td>✓</td>
                <td>✓</td>
                <td>N/A</td>
                <td>✓</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>857</td>
                <td>439</td>
                <td>805</td>
              </tr>
              <tr valign="top">
                <td>5189efbe-3382-4353-ad2f-9afd0255c2c8</td>
                <td>✓</td>
                <td>✓</td>
                <td>✓</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>875</td>
                <td>276</td>
                <td>674</td>
              </tr>
              <tr valign="top">
                <td>253f0e2d-bebd-464b-81c5-8dd8385192b3</td>
                <td>✓</td>
                <td>✓</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>117</td>
                <td>116</td>
                <td>217</td>
              </tr>
              <tr valign="top">
                <td>d199cfb0-91e8-471d-b1b3-53189cd64ee0</td>
                <td>✓</td>
                <td>✓</td>
                <td>✓</td>
                <td>N/A</td>
                <td>✓</td>
                <td>N/A</td>
                <td>21</td>
                <td>11</td>
                <td>81</td>
              </tr>
              <tr valign="top">
                <td>5d3205a3-28c4-45eb-bfd8-b32d67c3be0f</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>N/A</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>CGT: Cancer Gene Trust.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>OMOP: Observational Medical Outcomes Partnership.</p>
            </fn>
            <fn id="table3fn3">
              <p><sup>c</sup>UUID: universally unique identifier.</p>
            </fn>
            <fn id="table3fn4">
              <p><sup>d</sup>FMI: Foundation Medicine.</p>
            </fn>
            <fn id="table3fn5">
              <p><sup>e</sup>UCSF: University of California, San Francisco</p>
            </fn>
            <fn id="table3fn6">
              <p><sup>f</sup>CT: computed tomography.</p>
            </fn>
            <fn id="table3fn7">
              <p><sup>g</sup>N/A: not applicable.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Breakdown of Available Data in Cancer Gene Trust by Patient</title>
        <p>The CGT Public ID refers to the globally unique hexadecimal identifier per patient. ✓ indicates that data are available for that particular modality per patient. For the OMOP data, the numbers reflect how many data elements are available per modality.</p>
      </sec>
      <sec>
        <title>Genomic Breakdown of Cancer Gene Trust Cohort of Patients With Foundation One Reports</title>
        <p>Of patients with genomic data, the majority (n=13) had Foundation One sequencing performed and, as such, we focus on these data for a breakdown analysis (<xref rid="figure2" ref-type="fig">Figure 2</xref>). Across all patients, we identified 139 mutations in 95 genes (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). On average, patients had 10.69 (SD 5.34) somatic variants, with the most being 21 and the fewest being 3, across different current knowledge status (ie, known pathogenic, likely pathogenic, or of unknown consequence; panel A). On average, these somatic variants were primarily unknown (panel B left), with a mean of 8.07 (SD 4.57) per patient. Patients had an average of 2.18 (SD 0.98) of known and 1.43 (SD 0.79) likely variants. In terms of their functional effect, the majority of variants were missense (83.5% (116/139), panel B right). These patients had various primary diseases, the most prevalent being pancreatic (n=4, panel C left). For these patients, biopsies were taken from various tissues of origin, the most prevalent being liver (n=5, panel C right). Please refer to <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> for a diagram illustrating connections between tissue of origin and primary disease for these patients. We further break down the functional effect and status of variants by tissue of origin and primary disease in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. These, of course, should be considered in context to the number of patients by tissue of origin and primary disease. With these considerations, we still found some interesting trends. For instance, lymph node tissue of origin (n=1 patient) had the fewest variants (n=3) with no known pathological variants, whereas omentum tissue of origin had the most for a single patient (n=21) with three known pathological variants. Of course, these trends could depend on patient-specific or severity variations, and will require more patient data.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Breakdown of Foundation One genomics results for pilot cohort. (A) The breakdown of number of variants reported per patient stratified by their current knowledge status. (B) Breakdown of all variants for patients by effect (left) current knowledge status (right). (C) Distribution of cancer type per patient by primary disease (left) and tissue of origin (right). (D) Distribution of genes based on the current knowledge status of encompassed variants. (E) List of the most commonly recurrently mutated genes (N&#62;1) by number of encompassed variants by status. Black dots represent number of unique patients with a variant in the gene.</p>
          </caption>
          <graphic xlink:href="jmir_v22i3e16810_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>Across all patients, the 95 genes contained variants with various levels of knowledge status, including overlapping domains if there were more than one variant identified per gene (panel D). Here, we also see that the majority of genes had variants of unknown significance (n=82). There were 10 genes that contained multiple variants of different knowledge classes. The most commonly mutated genes across individuals (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> and panel E, black dots) were KRAS and TP53 (n=5) followed by ARID1A and MLL2 (n=4). In a similar vein, MLL2 has the most unique variants identified (n=6 variants across 4 patients), followed by KRAS and TP53 (n=5 variants across 5 patients). The majority of genes with more than one carrier contained variants of unknown significance only (54% (14/26)), further exemplifying the need for combining real-world EHR with such genomic data. We further visualize the landscape of variants of unknown significance by effect overall and on a per-patient level in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. We notice that for 1 patient with pancreatic cancer and tissue biopsy, for instance, there is one nonsense mutation in TGFBR2 with a current unknown knowledge status. According to TCGA GDC data portal, there are only 15 cases of primary site pancreatic cancer (TCGA-PAAD) with variants in this gene, and only two are stop-gain. Sharing data such as these with other researchers could quickly expand current knowledge status of variants and their association with disease.</p>
      </sec>
      <sec>
        <title>Comparing Robustness of Clinical Data Procedures</title>
        <p>To identify the most robust format of clinical data to share on CGT, we assessed whether there was a significant difference in scoring quality between two disparate data formats, specifically the prospectively collected registry and retrospectively gathered OMOP. We hypothesized that there would be no overall difference in scoring quality because both methodologies in theory should capture the main core competencies of interest.</p>
        <p>Although we found that total score across all patients and data elements were higher for registry compared with OMOP (<xref ref-type="table" rid="table4">Table 4</xref>; 642 vs 560), this difference was not statistically significant (<italic>P</italic>=.13, V=44).We further analyzed any significant discrepancies by core competency data element (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>; <xref ref-type="table" rid="table1">Table 1</xref> for element descriptions and source).We found no significant difference for Gender (<italic>P</italic>=.35, V=3), Ethnicity (<italic>P</italic>=.17, V=6), Race (<italic>P</italic>=.17, V=13), Year of Birth (<italic>P</italic>=.35, V=3), Basis of Diagnosis (<italic>P</italic>=.66, V=45), Cancer Site (<italic>P</italic>=.09, V=0), Therapeutic Agent/Modality (<italic>P</italic>=.17, V=21), and Beginning and End Dates of Treatment (<italic>P</italic>=.47, V=20). We did find, however, that there was a significant difference between OMOP and registry scoring for Date of Diagnosis (<italic>P</italic>=.004, V=0), with registry having higher scores (<italic>P</italic>=.002, V=0), and Cancer Histology (<italic>P</italic>=.0004, V=0), with registry having higher scores (<italic>P</italic>&#60;.001, V=0). See <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> for per patient, per element scores for registry and OMOP, respectively.</p>
        <p>Break down of <italic>gold standard</italic> elements and their respective fields in registry and OMOP is given in <xref ref-type="table" rid="table4">Table 4</xref>.</p>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Overall patient scores for registry vs Observational Medical Outcomes Partnership formats.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="430"/>
            <col width="290"/>
            <col width="280"/>
            <thead>
              <tr valign="top">
                <td>Patient</td>
                <td>Registry</td>
                <td>OMOP<sup>a</sup></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>f9b6a782-bbf5-4be8-bf7e-d1a9586d9552</td>
                <td>39</td>
                <td>28</td>
              </tr>
              <tr valign="top">
                <td>c2e2e081-4c39-4201-8a27-7b469ed39490</td>
                <td>41</td>
                <td>34</td>
              </tr>
              <tr valign="top">
                <td>db2d85aa-4f94-4e77-8755-6b94a710c1aa</td>
                <td>42</td>
                <td>32</td>
              </tr>
              <tr valign="top">
                <td>2fbc25da-3965-49c4-866f-72cf0abc2417</td>
                <td>48</td>
                <td>30</td>
              </tr>
              <tr valign="top">
                <td>940171e7-d358-463a-8d9a-2b2fa90c2a84</td>
                <td>31</td>
                <td>41</td>
              </tr>
              <tr valign="top">
                <td>f0314175-2d19-4146-8754-fc5aed3ab420</td>
                <td>29</td>
                <td>39</td>
              </tr>
              <tr valign="top">
                <td>c7dbcfac-37ea-43f8-8899-1a9f2fb56341</td>
                <td>15</td>
                <td>33</td>
              </tr>
              <tr valign="top">
                <td>ef5c3164-6f45-4d3a-88f0-4509226c5571</td>
                <td>50</td>
                <td>29</td>
              </tr>
              <tr valign="top">
                <td>ec3d977b-c310-4df3-a444-f79bc3dd8b58</td>
                <td>35</td>
                <td>33</td>
              </tr>
              <tr valign="top">
                <td>131cf62d-ad78-49c1-a699-5bcc1004cd12</td>
                <td>35</td>
                <td>33</td>
              </tr>
              <tr valign="top">
                <td>cf11c31c-f4c3-48ba-9c46-66f406d0b7a1</td>
                <td>47</td>
                <td>29</td>
              </tr>
              <tr valign="top">
                <td>ccc2ba97-912f-4b62-b767-cca129ee6a56</td>
                <td>13</td>
                <td>33</td>
              </tr>
              <tr valign="top">
                <td>104ec531-5d95-41e2-ac72-f6cff2006b8e</td>
                <td>35</td>
                <td>24</td>
              </tr>
              <tr valign="top">
                <td>a5627ac3-450d-4036-ade8-99ae62a5c232</td>
                <td>45</td>
                <td>34</td>
              </tr>
              <tr valign="top">
                <td>5189efbe-3382-4353-ad2f-9afd0255c2c8</td>
                <td>47</td>
                <td>38</td>
              </tr>
              <tr valign="top">
                <td>253f0e2d-bebd-464b-81c5-8dd8385192b3</td>
                <td>46</td>
                <td>37</td>
              </tr>
              <tr valign="top">
                <td>d199cfb0-91e8-471d-b1b3-53189cd64ee0</td>
                <td>44</td>
                <td>33</td>
              </tr>
              <tr valign="top">
                <td>Total</td>
                <td>642</td>
                <td>560</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup>OMOP: Observational Medical Outcomes Partnership.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>Total score per patient per data modality, specifically registry vs OMOP, compared with <italic>gold standard</italic> raw EHR data. Each score is the sum of all elements analyzed. Patient scores broken down by element can be found in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p>
      </sec>
      <sec>
        <title>Developing a Clinical Narrative From Cancer Gene Trust Data</title>
        <p>Although safely, securely, and robustly sharing clinically related patient data is an important procedure in and of itself, we want to demonstrate the power of this framework by compiling a clinical narrative solely from data shared on CGT. We elected to use patient c2e2e081-4c39-4201-8a27-7b469ed39490 as a highlighted example (see <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> for all relevant CGT hash information for this patient). We further show how to identify these data points using PatientExploreR-CGT in the following section.</p>
        <disp-quote>
          <p>On Day 1 (26,346 days from birth), patient underwent laparoscopic cholecystectomy (at a prior institution) which confirmed moderately differentiated adenocarcinoma with mucinous features. On day 42 (26,387), pathology was reviewed at UCSF which confirmed stage at pT2Nx. On Day 75 (26,420), patient underwent open partial hepatectomy, portal lymphadenectomy, and appendectomy. An FNA of RUQ skin nodule at prior trochar site on Day 195 (26,540) identified adenocarcinoma consistent with recurrence/metastasis from primary gallbladder site. CT C/A/P on Day 196 (26,540) showed multiple new peritoneal and ventral abdominal wall soft tissue nodules suspicious for metastases.</p>
        </disp-quote>
        <disp-quote>
          <p>Patient signed informed consent for CC#16457 clinical trial on Day 238 (26,583) andcompleted baselinescans on Day 244 (26,589; <xref rid="figure3" ref-type="fig">Figure 3</xref>E [left]; hash ids: QmaYX3YvzDrendfcfnK1otff1kw88stxWM8 XMUdsXXKSHP [parent], Qmd7V8hS2mCtup RLYk6Qm2AMHyk6X7Y4QPTDqZe7UCUnUT [image]) which showed unchanged disease from Day 196. Patient randomized to Arm B: merestinib/placebo + cisplatin + gemcitabine (not available in OMOP data) on Day 257 (26,602) and completed Cycle 1, Day 1 cisplatin + gemcitabine on Day 260 (26,605). On Day 286 (26,631), Cycle 2, Day 8 cisplatin + gemcitabine was completed.</p>
        </disp-quote>
        <disp-quote>
          <p>On Day 300, a CT C/A/P was performed (26,645; <xref rid="figure3" ref-type="fig">Figure 3</xref>E [right]; hash ids: QmQ6PtwhTM qw9b3SFsa1qfW79kGK7tPrhrUHpKVLtxmj1i [parent], QmZmVEsqNeCDuzUDDvLWYUdbxQ2QZ ehDhkdzyCNvX8gFJF [image]) and showed stable scattered abdominal wall, peritoneal and retroperitoneal implants. Interval progression of mild intrahepatic biliary dilatation, possibly due to new soft tissue prominence at the porta hepatis, concerning for recurrence. However, unchanged small upper lobe pulmonary nodules were noted and stable disease was concluded per RECIST, with 18.18% decrease in sum of target lesion diameters.</p>
        </disp-quote>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>PatientExploreR visualization app for Cancer Gene Trust (CGT). Breakdown of features available for the public PatientExploreR visualization application for CGT. (A) Landing page which has all options for browsing patients, exploring patient data, and information about CGT. This page also displays the amount of data currently compiled on CGT. (B) Browse tab for filtering for patient based on clinical concepts and/or demographics. This list is filtered by Gallbladder-related disease and patient c2e2e081-4c39-4201-8a27-7b469ed39490 was selected. (C) Explore tab that details patient’s background and clinical summary. The user can interact with clinical, genomic, and imaging data for selected patient. These data can be filtered and exported and control what is shown visually in the timeline view below. (D) Genomics data extracted and displayed from either the Foundation One or UCSF 500 report. (E) Two sample image scans that can be found via the imaging submenu or from clicking within the timeline view below. These CT scans show baseline and C3D1, 26,589 and 26,645 age in days, respectively. Baseline contrast enhanced CT of the abdomen shows a peritoneal metastasis (arrow) measuring 12×8 mm. Posttreatment contrast enhanced CT of the abdomen shows decreased size of the peritoneal metastasis (arrow) measuring 10×6 mm. (F) Timeline view of selected clinical and image data. This timeline view was produced by selecting the associated relevant medications in the Drug pull-down menu, specifically: capecitabine, cisplatin, fluorouracil, and trastuzumab. With Show Images selected, we can see what relevant medications the patient was prescribed when the images were taken. Pressing the link next to Value above, the user will be directed to all images taken during that visit, which can be viewed on an appropriate (eg, DICOM viewer) browser.</p>
          </caption>
          <graphic xlink:href="jmir_v22i3e16810_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Exploring Cancer Gene Trust Data on PatientExploreR-Cancer Gene Trust</title>
        <p>To further operationalize the CGT framework, we adapted an application called PatientExploreR to seamlessly interface with CGT to effectively explore, visualize, and download the data. We envision this application to be particularly useful for individuals without much data extraction and manipulation experience. This application requires no registration and is publicly available [<xref ref-type="bibr" rid="ref52">52</xref>]. PatientExploreR-CGT pulls all OMOP data from CGT, maps all clinical concepts according to the CDM, and provides convenient links to genomic data as well as image data in the context of their clinical history. In <xref rid="figure3" ref-type="fig">Figure 3</xref>, we demonstrate the power of the visualization by showing a detailed timeline of the above patient’s treatment timeline around the time of the available CT scans.</p>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Overview</title>
        <p>In this study, we have consented patients in an IRB-approved process to share deidentified EHRs, genomic, and imaging data using a blockchain-authenticated framework called CGT. Our goal of this pilot study was to demonstrate the process of patient consent to data sharing within a large public health institution as well as to create a framework that can facilitate other institutions, physicians, and patients to add their own data. The benefit of a block-chain authenticated system was more geared to decentralized access (authorization) rather than privacy or security (authentication) as all submissions are public by design. As we hypothesized, all 18 patients in the pilot study did not have reservations about sharing their data, which has been similarly demonstrated [<xref ref-type="bibr" rid="ref9">9</xref>], and we believe patients from other institutions have similar beliefs. Patient privacy was a top priority for this project and we actively coordinated the highest-standards for deidentification processing of all data shared (see <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> for deidentification process).</p>
        <p>In designing the CGT, we had to overcome the existing challenges in this space, namely that this framework should be secure, efficient, and scalable while being cost-efficient, open to the public, and not owned by a single institution. We also had to determine not only which data should be shared but also the appropriate format of such data that would balance interoperability with speed of sharing. Our pilot also addresses cultural and institutional challenges, both perceived and real, including the IRB, patient consent and education, and other elements.</p>
        <p>CGT is designed as an alternate approach to centralized data repository platforms such as Medical Information Mart for Intensive Care [<xref ref-type="bibr" rid="ref53">53</xref>] which have enabled a slew of powerful research. Unlike these primarily static databases, CGT can facilitate rapid and continual data being shared from the clinical care system as close to the time of generation and extraction as possible. Both systems have their merits and hopefully they will be complementary in providing access to deidentified EHR data to enable personalized medicine. Furthermore, CGT enables researchers to use and interpret medical data instead of resolving disparate access methods from multiple sources or failing entirely because data are simply not available in any format. Indeed, it is our hope that CGT can facilitate research studies and enhance clinical care on a timescale not previously possible, while allowing data holders to maintain the privacy and security of individual data sources and the nonpublic subset of the data [<xref ref-type="bibr" rid="ref36">36</xref>]. At the same time, this entire process will respect individual patient consents and cultural data sharing preferences and expectations. CGT enables aggregation of data from all consenting patients. CGT might bolster cancer research and help physicians, patients, payers, and other stakeholders make more informed decisions about the increasingly complex diagnosis and treatment of cancer as well as its reimbursement. CGT functions as a bridge between the highly regulated HIPAA environment (<xref rid="figure1" ref-type="fig">Figure 1</xref>) and the open World Wide Web internet environment. To alleviate concerns about data ownership, CGT is built on a decentralized, democratized blockchain format and will remain free and open.</p>
      </sec>
      <sec>
        <title>Principal Findings</title>
        <p>Compared with a list of <italic>gold standard</italic> data elements [<xref ref-type="bibr" rid="ref11">11</xref>] that should be shared in such a project, we found that there was no significant difference in completeness between a prospectively collected registry and a retrospective (OMOP) procedure for clinical data. Certain data elements, however, were more robustly recorded in the registry format, specifically Date of Diagnosis and Cancer Histology. For analyses that aim to further personalized medicine, such pieces of information might be critical, and we hope the findings from this study can help improve the continually adapting OMOP model to better encode such information. These lapses could also be due to institution-specific extract, transform, load (ETL) procedures.</p>
        <p>Each strategy has its respective benefits and weaknesses. Because registry data are manually coded, specific key pieces of information can be easily highlighted and identified. Furthermore, for registry data to be submitted to SEER, all pieces of information must be detailed, but this process is manual and time consuming, and often results in different stages of aggregation per patient. As such, we found higher levels of variance in registry records compared with those in OMOP (mean 37.77, SD 10.87 vs mean 32.94, SD 4.26), which could reflect delays in manual data aggregation (ie, <italic>suspense</italic> states) or quality. It was clear though that more patients had more complete information from registry data than OMOP, with 5 patients having more than 90% completeness cores (ie, &#62;45 total score) in registry vs 0 in OMOP. However, by relying on the open source OMOP standard, instead of registry or a proprietary EHR structure, the barrier for distributing and sharing data is drastically lowered through reducing ETL transformation, which also lowers cost through leveraging the conversion processes already occurring in many hospital systems. Researchers recently demonstrated the power of OMOP for facilitating phenotype transfer across sites [<xref ref-type="bibr" rid="ref54">54</xref>], which aligns well with the goal of CGT. The additional costs of time are the clinical and regulatory tasks involved in consenting patients and obtaining, anonymizing, and uploading data. This process accounts for the majority of cost which will further decrease in high volume.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>There are many limitations of this study that need to be addressed. Both the registry and OMOP EHR extract did not contain all valuable and relevant core data elements. Therefore, the comparison of data robustness cannot be extended to all <italic>gold-standard</italic> elements that ideally should be shared in such a project. As OMOP is from retrospective extraction process, there is no immediate way to automatically identify primary cancer and therapeutic efficacy, although we hope this can be mediated by subsequent incorporation of deidentified notes or new schema adaptations or developments. Similar to any noncurated database, data quality for both registry and OMOP is limited by those who entered it and could be affected by infrastructural biases of individuals and EHR systems [<xref ref-type="bibr" rid="ref55">55</xref>]. In addition, the current framework is steward based, which means that there needs to be a single individual or team representative to submit data per institution. Similar to any cross-institution data link of deidentified data, there is no procedure in place to be able to map the same patient across stewards as there exists within the registry system. Although we tried to create a rule-based scoring system that is as unbiased as possible involving 2 separate reviewers, the manual scoring of data elements did contain levels of subjectivity and potential ambiguity, which is fully detailed in the <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p>
        <p>There are also risks of reidentification associated with data sharing, even beyond accidental leakage. Even for incomplete, fully deidentified data, for instance, a recent study was able to use generative copula-based method to accurately reidentify 99.98% of American individuals based on only 15 demographic attributes [<xref ref-type="bibr" rid="ref56">56</xref>]. Of course, many of these variables used in this paper are not available in this dataset, but it is important to note as other models might be developed in the future those could be applied to the data shared. Overall, these risks need to be weighed against the stagnation associated with keeping these valuable data siloed. Not sharing all details pertaining to treatment efficacy and adverse drug effects are not in the best interests of general public and overall scientific and medical community. Despite these limitations, open scientific data sharing has been an enormous boon in many fields and we believe that CGT presents a proof of concept that useful medical data can be openly shared. We further demonstrated the feasibility and utility of this process in a pilot study and provide fully detailed steps for other institutions to consent and add their patients’ data. The ultimate success of this platform will be determined by the flow of patient data and how it can be used to facilitate discoveries and help personalize treatment.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>Each cancer case is unique and requires as much data as possible to inform ideal treatment decisions. The more data that exist and are released can help clinicians identify ideal personalized treatment for their patients. We found the OMOP CDM is a scalable format for dissemination, although it can be improved by better information in key data element fields such as cancer histology as compared with a prospectively collected registry format. The OHDSI Oncology Working Group [<xref ref-type="bibr" rid="ref12">12</xref>] is currently developing an extension to OMOP to support observational cancer research that better captures and records elements we found available in the registry format but not in the current OMOP implementation. We believe such an effort is invaluable to reconcile these differences and should be integrated into the future version of CGT. Put together, we hope that the CGT framework, pilot study, and interactive visualization application furthers the ideals of the cancer Moonshot project, unleashing data trapped in silos to further cancer research and reveal patterns that can help further personalize treatment.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Supplementary materials, including supplementary methods, figures, and tables.</p>
        <media xlink:href="jmir_v22i3e16810_app1.docx" xlink:title="DOCX File , 2909 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">CDM</term>
          <def>
            <p>common data model</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">CGT</term>
          <def>
            <p>Cancer Gene Trust</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">CT</term>
          <def>
            <p>computed tomography</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">EDW</term>
          <def>
            <p>Enterprise Data Warehouse</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">EHR</term>
          <def>
            <p>electronic health record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">ETL</term>
          <def>
            <p>extract, transform, load</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">HIPAA</term>
          <def>
            <p>Health Insurance Portability and Accountability Act </p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">IPFS</term>
          <def>
            <p>InterPlanetary File System</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">IRB</term>
          <def>
            <p>institutional review board</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">MRN</term>
          <def>
            <p>medical record number</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">OHDSI</term>
          <def>
            <p>Observational Health Data Sciences and Informatics</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">OMOP</term>
          <def>
            <p>Observational Medical Outcomes Partnership</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb13">PHI</term>
          <def>
            <p>protected health information</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb14">SEER</term>
          <def>
            <p>Surveillance, Epidemiology, and End Results</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb15">UCSF</term>
          <def>
            <p>University of California, San Francisco</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb16">UUID</term>
          <def>
            <p>universally unique identifier</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>We acknowledge the UCSF Academic Research Systems group for making available the deidentified OMOP data. We are grateful for Foundation Medicine for supplying XML files. We thank Boris Oskotsky for help setting up the server for PatientExploreR-CGT. We thank Atul Butte and Barbara Koening for helpful comments and Max Haeussler for the early technical inspiration. We also wish to thank Rachael Liao, Bartha Knoppers, Adrian Thorogood, and the Global Alliance for Genomics and Health (GA4GH) for their collaboration and guidance. BG was affiliated with the Bakar Computational Health Sciences Institute at the University of California, San Francisco, at the time of the study and is currently affiliated with the Hasso Plattner Institute for Digital Health at Mount Sinai within the Icahn School of Medicine at Mount Sinai. This publication was supported partially by the National Center for Advancing Translational Sciences, National Institutes of Health, through UCSF-CTSI [UL1 TR001872], National Cancer Institute of the National Institutes of Health under award numbers 5U24CA180951-04 and 5U24CA210974-02 to DH, as well as a Marcus Foundation Award to EC. TG graciously acknowledges support from the National Cancer Institute Oncology Model Forum project National Institutes of Health grant U24 CA195858.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schilsky</surname>
              <given-names>RL</given-names>
            </name>
          </person-group>
          <article-title>Personalized medicine in oncology: the future is now</article-title>
          <source>Nat Rev Drug Discov</source>
          <year>2010</year>
          <month>05</month>
          <volume>9</volume>
          <issue>5</issue>
          <fpage>363</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.1038/nrd3181</pub-id>
          <pub-id pub-id-type="medline">20431568</pub-id>
          <pub-id pub-id-type="pii">nrd3181</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Iyer</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Hanrahan</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Milowsky</surname>
              <given-names>MI</given-names>
            </name>
            <name name-style="western">
              <surname>Al-Ahmadie</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Scott</surname>
              <given-names>SN</given-names>
            </name>
            <name name-style="western">
              <surname>Janakiraman</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pirun</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sander</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Socci</surname>
              <given-names>ND</given-names>
            </name>
            <name name-style="western">
              <surname>Ostrovnaya</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Viale</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Heguy</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Chan</surname>
              <given-names>TA</given-names>
            </name>
            <name name-style="western">
              <surname>Bochner</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Bajorin</surname>
              <given-names>DF</given-names>
            </name>
            <name name-style="western">
              <surname>Berger</surname>
              <given-names>MF</given-names>
            </name>
            <name name-style="western">
              <surname>Taylor</surname>
              <given-names>BS</given-names>
            </name>
            <name name-style="western">
              <surname>Solit</surname>
              <given-names>DB</given-names>
            </name>
          </person-group>
          <article-title>Genome sequencing identifies a basis for everolimus sensitivity</article-title>
          <source>Science</source>
          <year>2012</year>
          <month>10</month>
          <day>12</day>
          <volume>338</volume>
          <issue>6104</issue>
          <fpage>221</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.sciencemag.org/cgi/pmidlookup?view=long&#38;pmid=22923433"/>
          </comment>
          <pub-id pub-id-type="doi">10.1126/science.1226344</pub-id>
          <pub-id pub-id-type="medline">22923433</pub-id>
          <pub-id pub-id-type="pii">science.1226344</pub-id>
          <pub-id pub-id-type="pmcid">PMC3633467</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sherman</surname>
              <given-names>RE</given-names>
            </name>
            <name name-style="western">
              <surname>Anderson</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Pan</surname>
              <given-names>GJ</given-names>
            </name>
            <name name-style="western">
              <surname>Gray</surname>
              <given-names>GW</given-names>
            </name>
            <name name-style="western">
              <surname>Gross</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Hunter</surname>
              <given-names>NL</given-names>
            </name>
            <name name-style="western">
              <surname>LaVange</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Marinac-Dabic</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Marks</surname>
              <given-names>PW</given-names>
            </name>
            <name name-style="western">
              <surname>Robb</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Shuren</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Temple</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Woodcock</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Yue</surname>
              <given-names>LQ</given-names>
            </name>
            <name name-style="western">
              <surname>Califf</surname>
              <given-names>RM</given-names>
            </name>
          </person-group>
          <article-title>Real-world evidence - what is it and what can it tell us?</article-title>
          <source>N Engl J Med</source>
          <year>2016</year>
          <month>12</month>
          <day>8</day>
          <volume>375</volume>
          <issue>23</issue>
          <fpage>2293</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.1056/NEJMsb1609216</pub-id>
          <pub-id pub-id-type="medline">27959688</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Glicksberg</surname>
              <given-names>BS</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>KW</given-names>
            </name>
            <name name-style="western">
              <surname>Dudley</surname>
              <given-names>JT</given-names>
            </name>
          </person-group>
          <article-title>The next generation of precision medicine: observational studies, electronic health records, biobanks and continuous monitoring</article-title>
          <source>Hum Mol Genet</source>
          <year>2018</year>
          <month>05</month>
          <day>1</day>
          <volume>27</volume>
          <issue>R1</issue>
          <fpage>R56</fpage>
          <lpage>62</lpage>
          <pub-id pub-id-type="doi">10.1093/hmg/ddy114</pub-id>
          <pub-id pub-id-type="medline">29659828</pub-id>
          <pub-id pub-id-type="pii">4969371</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Norgeot</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Glicksberg</surname>
              <given-names>BS</given-names>
            </name>
            <name name-style="western">
              <surname>Butte</surname>
              <given-names>AJ</given-names>
            </name>
          </person-group>
          <article-title>A call for deep-learning healthcare</article-title>
          <source>Nat Med</source>
          <year>2019</year>
          <month>01</month>
          <volume>25</volume>
          <issue>1</issue>
          <fpage>14</fpage>
          <lpage>5</lpage>
          <pub-id pub-id-type="doi">10.1038/s41591-018-0320-3</pub-id>
          <pub-id pub-id-type="medline">30617337</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41591-018-0320-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nwaru</surname>
              <given-names>BI</given-names>
            </name>
            <name name-style="western">
              <surname>Friedman</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Halamka</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sheikh</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Can learning health systems help organisations deliver personalised care?</article-title>
          <source>BMC Med</source>
          <year>2017</year>
          <month>10</month>
          <day>2</day>
          <volume>15</volume>
          <issue>1</issue>
          <fpage>177</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedicine.biomedcentral.com/articles/10.1186/s12916-017-0935-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12916-017-0935-0</pub-id>
          <pub-id pub-id-type="medline">28965492</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12916-017-0935-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC5623976</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Agarwala</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Khozin</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Singal</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>O'Connell</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Kuk</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Gossai</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Abernethy</surname>
              <given-names>AP</given-names>
            </name>
          </person-group>
          <article-title>Real-world evidence in support of precision medicine: clinico-genomic cancer data as a case study</article-title>
          <source>Health Aff (Millwood)</source>
          <year>2018</year>
          <month>05</month>
          <volume>37</volume>
          <issue>5</issue>
          <fpage>765</fpage>
          <lpage>72</lpage>
          <pub-id pub-id-type="doi">10.1377/hlthaff.2017.1579</pub-id>
          <pub-id pub-id-type="medline">29733723</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Adler-Milstein</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jha</surname>
              <given-names>AK</given-names>
            </name>
          </person-group>
          <article-title>Sharing clinical data electronically: a critical challenge for fixing the health care system</article-title>
          <source>J Am Med Assoc</source>
          <year>2012</year>
          <month>04</month>
          <day>25</day>
          <volume>307</volume>
          <issue>16</issue>
          <fpage>1695</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.1001/jama.2012.525</pub-id>
          <pub-id pub-id-type="medline">22535851</pub-id>
          <pub-id pub-id-type="pii">307/16/1695</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mello</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Lieou</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Goodman</surname>
              <given-names>SN</given-names>
            </name>
          </person-group>
          <article-title>Clinical trial participants' views of the risks and benefits of data sharing</article-title>
          <source>N Engl J Med</source>
          <year>2018</year>
          <month>06</month>
          <day>7</day>
          <volume>378</volume>
          <issue>23</issue>
          <fpage>2202</fpage>
          <lpage>11</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29874542"/>
          </comment>
          <pub-id pub-id-type="doi">10.1056/NEJMsa1713258</pub-id>
          <pub-id pub-id-type="medline">29874542</pub-id>
          <pub-id pub-id-type="pmcid">PMC6057615</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Beaulieu-Jones</surname>
              <given-names>BK</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>ZS</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Bhavnani</surname>
              <given-names>SP</given-names>
            </name>
            <name name-style="western">
              <surname>Byrd</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Greene</surname>
              <given-names>CS</given-names>
            </name>
          </person-group>
          <article-title>Privacy-preserving generative deep neural networks support clinical data sharing</article-title>
          <source>Circ Cardiovasc Qual Outcomes</source>
          <year>2019</year>
          <month>07</month>
          <volume>12</volume>
          <issue>7</issue>
          <fpage>e005122</fpage>
          <pub-id pub-id-type="doi">10.1161/CIRCOUTCOMES.118.005122</pub-id>
          <pub-id pub-id-type="medline">31284738</pub-id>
          <pub-id pub-id-type="pmcid">PMC7041894</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Conley</surname>
              <given-names>RB</given-names>
            </name>
            <name name-style="western">
              <surname>Dickson</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Zenklusen</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Al Naber</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Messner</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Atasoy</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Chaihorsky</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Collyar</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Compton</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Ferguson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Khozin</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Klein</surname>
              <given-names>RD</given-names>
            </name>
            <name name-style="western">
              <surname>Kotte</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kurzrock</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Marino</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>McDonough</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>McNeal</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Schilsky</surname>
              <given-names>RL</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>LI</given-names>
            </name>
          </person-group>
          <article-title>Core clinical data elements for cancer genomic repositories: a multi-stakeholder consensus</article-title>
          <source>Cell</source>
          <year>2017</year>
          <month>11</month>
          <day>16</day>
          <volume>171</volume>
          <issue>5</issue>
          <fpage>982</fpage>
          <lpage>6</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0092-8674(17)31254-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.cell.2017.10.032</pub-id>
          <pub-id pub-id-type="medline">29149611</pub-id>
          <pub-id pub-id-type="pii">S0092-8674(17)31254-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="web">
          <source>OHDSI – Observational Health Data Sciences and Informatics</source>
          <access-date>2019-09-01</access-date>
          <comment>OHDSI Oncology Working Group<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ohdsi.org/web/wiki/doku.php?id=projects:workgroups:oncology-sg#">https://www.ohdsi.org/web/wiki/doku.php?id=projects:workgroups:oncology-sg#</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Singal</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>PG</given-names>
            </name>
            <name name-style="western">
              <surname>Agarwala</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Kaushik</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Backenroth</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Gossai</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Frampton</surname>
              <given-names>GM</given-names>
            </name>
            <name name-style="western">
              <surname>Torres</surname>
              <given-names>AZ</given-names>
            </name>
            <name name-style="western">
              <surname>Lehnert</surname>
              <given-names>EM</given-names>
            </name>
            <name name-style="western">
              <surname>Bourque</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>O'Connell</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bowser</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Caron</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Baydur</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Seidl-Rathkopf</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Ivanov</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Alpha-Cobb</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Guria</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Frank</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Nunnally</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Bailey</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Jaskiw</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Feuchtbaum</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Nussbaum</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Abernethy</surname>
              <given-names>AP</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>VA</given-names>
            </name>
          </person-group>
          <article-title>Association of patient characteristics and tumor genomics with clinical outcomes among patients with non-small cell lung cancer using a clinicogenomic database</article-title>
          <source>J Am Med Assoc</source>
          <year>2019</year>
          <month>04</month>
          <day>9</day>
          <volume>321</volume>
          <issue>14</issue>
          <fpage>1391</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30964529"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jama.2019.3241</pub-id>
          <pub-id pub-id-type="medline">30964529</pub-id>
          <pub-id pub-id-type="pii">2730114</pub-id>
          <pub-id pub-id-type="pmcid">PMC6459115</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Shervey</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dudley</surname>
              <given-names>JT</given-names>
            </name>
            <name name-style="western">
              <surname>Zimmerman</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Privacy-preserving methods for feature engineering using blockchain: review, evaluation, and proof of concept</article-title>
          <source>J Med Internet Res</source>
          <year>2019</year>
          <month>08</month>
          <day>14</day>
          <volume>21</volume>
          <issue>8</issue>
          <fpage>e13600</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2019/8/e13600/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/13600</pub-id>
          <pub-id pub-id-type="medline">31414666</pub-id>
          <pub-id pub-id-type="pii">v21i8e13600</pub-id>
          <pub-id pub-id-type="pmcid">PMC6712958</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>White</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Schmidt</surname>
              <given-names>DC</given-names>
            </name>
            <name name-style="western">
              <surname>Lenz</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Rosenbloom</surname>
              <given-names>ST</given-names>
            </name>
          </person-group>
          <article-title>FHIRChain: applying blockchain to securely and scalably share clinical data</article-title>
          <source>Comput Struct Biotechnol J</source>
          <year>2018</year>
          <volume>16</volume>
          <fpage>267</fpage>
          <lpage>78</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2001-0370(18)30037-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.csbj.2018.07.004</pub-id>
          <pub-id pub-id-type="medline">30108685</pub-id>
          <pub-id pub-id-type="pii">S2001-0370(18)30037-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC6082774</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dubovitskaya</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Ryu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Schumacher</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Secure and trustable electronic medical records sharing using blockchain</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2017</year>
          <volume>2017</volume>
          <fpage>650</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29854130"/>
          </comment>
          <pub-id pub-id-type="medline">29854130</pub-id>
          <pub-id pub-id-type="pmcid">PMC5977675</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mamoshina</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Ojomoko</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Yanovich</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Ostrovski</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Botezatu</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Prikhodko</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Izumchenko</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Aliper</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Romantsov</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Zhebrak</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ogu</surname>
              <given-names>IO</given-names>
            </name>
            <name name-style="western">
              <surname>Zhavoronkov</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Converging blockchain and next-generation artificial intelligence technologies to decentralize and accelerate biomedical research and healthcare</article-title>
          <source>Oncotarget</source>
          <year>2018</year>
          <month>01</month>
          <day>19</day>
          <volume>9</volume>
          <issue>5</issue>
          <fpage>5665</fpage>
          <lpage>90</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.impactjournals.com/oncotarget/misc/linkedout.php?pii=22345"/>
          </comment>
          <pub-id pub-id-type="doi">10.18632/oncotarget.22345</pub-id>
          <pub-id pub-id-type="medline">29464026</pub-id>
          <pub-id pub-id-type="pii">22345</pub-id>
          <pub-id pub-id-type="pmcid">PMC5814166</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ozercan</surname>
              <given-names>HI</given-names>
            </name>
            <name name-style="western">
              <surname>Ileri</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Ayday</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Alkan</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Realizing the potential of blockchain technologies in genomics</article-title>
          <source>Genome Res</source>
          <year>2018</year>
          <month>09</month>
          <volume>28</volume>
          <issue>9</issue>
          <fpage>1255</fpage>
          <lpage>63</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://genome.cshlp.org:4040/cgi/pmidlookup?view=long&#38;pmid=30076130"/>
          </comment>
          <pub-id pub-id-type="doi">10.1101/gr.207464.116</pub-id>
          <pub-id pub-id-type="medline">30076130</pub-id>
          <pub-id pub-id-type="pii">gr.207464.116</pub-id>
          <pub-id pub-id-type="pmcid">PMC6120626</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>DR</given-names>
            </name>
            <name name-style="western">
              <surname>Bhattacharya</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Butte</surname>
              <given-names>AJ</given-names>
            </name>
          </person-group>
          <article-title>Prototype of running clinical trials in an untrustworthy environment using blockchain</article-title>
          <source>Nat Commun</source>
          <year>2019</year>
          <month>02</month>
          <day>22</day>
          <volume>10</volume>
          <issue>1</issue>
          <fpage>917</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30796226"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41467-019-08874-y</pub-id>
          <pub-id pub-id-type="medline">30796226</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41467-019-08874-y</pub-id>
          <pub-id pub-id-type="pmcid">PMC6384889</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kuo</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Zavaleta Rojas</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Ohno-Machado</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Comparison of blockchain platforms: a systematic review and healthcare examples</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2019</year>
          <month>05</month>
          <day>1</day>
          <volume>26</volume>
          <issue>5</issue>
          <fpage>462</fpage>
          <lpage>78</lpage>
          <pub-id pub-id-type="doi">10.1093/jamia/ocy185</pub-id>
          <pub-id pub-id-type="medline">30907419</pub-id>
          <pub-id pub-id-type="pii">5419321</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Park</surname>
              <given-names>YR</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Na</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Is blockchain technology suitable for managing personal health records? Mixed-methods study to test feasibility</article-title>
          <source>J Med Internet Res</source>
          <year>2019</year>
          <month>02</month>
          <day>8</day>
          <volume>21</volume>
          <issue>2</issue>
          <fpage>e12533</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2019/2/e12533/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/12533</pub-id>
          <pub-id pub-id-type="medline">30735142</pub-id>
          <pub-id pub-id-type="pii">v21i2e12533</pub-id>
          <pub-id pub-id-type="pmcid">PMC6384539</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vazirani</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>O'Donoghue</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Brindley</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Meinert</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Implementing blockchains for efficient health care: systematic review</article-title>
          <source>J Med Internet Res</source>
          <year>2019</year>
          <month>02</month>
          <day>12</day>
          <volume>21</volume>
          <issue>2</issue>
          <fpage>e12439</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2019/2/e12439/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/12439</pub-id>
          <pub-id pub-id-type="medline">30747714</pub-id>
          <pub-id pub-id-type="pii">v21i2e12439</pub-id>
          <pub-id pub-id-type="pmcid">PMC6390185</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="web">
          <source>Cancer Gene Trust</source>
          <access-date>2019-10-27</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cancergenetrust.org">https://www.cancergenetrust.org</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="web">
          <source>Ethereum</source>
          <access-date>2019-10-27</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ethereum.org">https://ethereum.org</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="web">
          <source>IPFS Powers the Distributed Web</source>
          <access-date>2019-10-27</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ipfs.io">https://ipfs.io</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="web">
          <source>Cancer Gene Trust Protocol</source>
          <access-date>2019-10-27</access-date>
          <comment>Sharing Clinical and Genomic Data in Cancer Research<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cancergenetrust.org/docs/cgt-ucsf-protocol.pdf">https://www.cancergenetrust.org/docs/cgt-ucsf-protocol.pdf</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="web">
          <source>GitHub</source>
          <access-date>2019-10-27</access-date>
          <comment>Cancer Gene Trust<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.github.com/cancergenetrust">https://www.github.com/cancergenetrust</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Frampton</surname>
              <given-names>GM</given-names>
            </name>
            <name name-style="western">
              <surname>Fichtenholtz</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Otto</surname>
              <given-names>GA</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Downing</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Schnall-Levin</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>White</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sanford</surname>
              <given-names>EM</given-names>
            </name>
            <name name-style="western">
              <surname>An</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Juhn</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Brennan</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Iwanik</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Maillet</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Buell</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>White</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Balasubramanian</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Terzic</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Richards</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Banning</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Garcia</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Mahoney</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Zwirko</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Donahue</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Beltran</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Mosquera</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Rubin</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Dogan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hedvat</surname>
              <given-names>CV</given-names>
            </name>
            <name name-style="western">
              <surname>Berger</surname>
              <given-names>MF</given-names>
            </name>
            <name name-style="western">
              <surname>Pusztai</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Lechner</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Boshoff</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Jarosz</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Vietz</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Parker</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>VA</given-names>
            </name>
            <name name-style="western">
              <surname>Ross</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Curran</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Cronin</surname>
              <given-names>MT</given-names>
            </name>
            <name name-style="western">
              <surname>Stephens</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Lipson</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Yelensky</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Development and validation of a clinical cancer genomic profiling test based on massively parallel DNA sequencing</article-title>
          <source>Nat Biotechnol</source>
          <year>2013</year>
          <month>11</month>
          <volume>31</volume>
          <issue>11</issue>
          <fpage>1023</fpage>
          <lpage>31</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24142049"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/nbt.2696</pub-id>
          <pub-id pub-id-type="medline">24142049</pub-id>
          <pub-id pub-id-type="pii">nbt.2696</pub-id>
          <pub-id pub-id-type="pmcid">PMC5710001</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Joseph</surname>
              <given-names>NM</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Nasr</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Yeh</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Talevich</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Onodera</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bastian</surname>
              <given-names>BC</given-names>
            </name>
            <name name-style="western">
              <surname>Rabban</surname>
              <given-names>JT</given-names>
            </name>
            <name name-style="western">
              <surname>Garg</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Zaloudek</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Solomon</surname>
              <given-names>DA</given-names>
            </name>
          </person-group>
          <article-title>Genomic profiling of malignant peritoneal mesothelioma reveals recurrent alterations in epigenetic regulatory genes BAP1, SETD2, and DDX3X</article-title>
          <source>Mod Pathol</source>
          <year>2017</year>
          <month>02</month>
          <volume>30</volume>
          <issue>2</issue>
          <fpage>246</fpage>
          <lpage>54</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.doi.org/10.1038/modpathol.2016.188"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/modpathol.2016.188</pub-id>
          <pub-id pub-id-type="medline">27813512</pub-id>
          <pub-id pub-id-type="pii">modpathol2016188</pub-id>
          <pub-id pub-id-type="pmcid">PMC5288276</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="web">
          <source>Foundation Medicine</source>
          <access-date>2019-10-27</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.foundationmedicine.com/">https://www.foundationmedicine.com/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kline</surname>
              <given-names>CN</given-names>
            </name>
            <name name-style="western">
              <surname>Joseph</surname>
              <given-names>NM</given-names>
            </name>
            <name name-style="western">
              <surname>Grenert</surname>
              <given-names>JP</given-names>
            </name>
            <name name-style="western">
              <surname>van Ziffle</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Talevich</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Onodera</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Aboian</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cha</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Raleigh</surname>
              <given-names>DR</given-names>
            </name>
            <name name-style="western">
              <surname>Braunstein</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Torkildson</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Samuel</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Bloomer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Campomanes</surname>
              <given-names>AG</given-names>
            </name>
            <name name-style="western">
              <surname>Banerjee</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Butowski</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Raffel</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Tihan</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Bollen</surname>
              <given-names>AW</given-names>
            </name>
            <name name-style="western">
              <surname>Phillips</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Korn</surname>
              <given-names>WM</given-names>
            </name>
            <name name-style="western">
              <surname>Yeh</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Bastian</surname>
              <given-names>BC</given-names>
            </name>
            <name name-style="western">
              <surname>Gupta</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Mueller</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Perry</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Nicolaides</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Solomon</surname>
              <given-names>DA</given-names>
            </name>
          </person-group>
          <article-title>Targeted next-generation sequencing of pediatric neuro-oncology patients improves diagnosis, identifies pathogenic germline mutations, and directs targeted therapy</article-title>
          <source>Neuro Oncol</source>
          <year>2017</year>
          <month>05</month>
          <day>1</day>
          <volume>19</volume>
          <issue>5</issue>
          <fpage>699</fpage>
          <lpage>709</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/28453743"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/neuonc/now254</pub-id>
          <pub-id pub-id-type="medline">28453743</pub-id>
          <pub-id pub-id-type="pii">now254</pub-id>
          <pub-id pub-id-type="pmcid">PMC5464451</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="web">
          <source>OHDSI – Observational Health Data Sciences and Informatics</source>
          <access-date>2019-09-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ohdsi.org/">https://www.ohdsi.org/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stang</surname>
              <given-names>PE</given-names>
            </name>
            <name name-style="western">
              <surname>Ryan</surname>
              <given-names>PB</given-names>
            </name>
            <name name-style="western">
              <surname>Racoosin</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Overhage</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Hartzema</surname>
              <given-names>AG</given-names>
            </name>
            <name name-style="western">
              <surname>Reich</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Welebob</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Scarnecchia</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Woodcock</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Advancing the science for active surveillance: rationale and design for the Observational Medical Outcomes Partnership</article-title>
          <source>Ann Intern Med</source>
          <year>2010</year>
          <month>11</month>
          <day>2</day>
          <volume>153</volume>
          <issue>9</issue>
          <fpage>600</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.7326/0003-4819-153-9-201011020-00010</pub-id>
          <pub-id pub-id-type="medline">21041580</pub-id>
          <pub-id pub-id-type="pii">153/9/600</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="web">
          <source>Surveillance, Epidemiology, and End Results Program</source>
          <access-date>2019-09-01</access-date>
          <comment>SEER Program Coding and Staging Manual 2018<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://seer.cancer.gov/tools/codingmanuals/">https://seer.cancer.gov/tools/codingmanuals/</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="web">
          <source>NAACCR</source>
          <access-date>2019-09-01</access-date>
          <comment>Data Standards &#38; Data Dictionary, Volume II<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.naaccr.org/data-standards-data-dictionary/">https://www.naaccr.org/data-standards-data-dictionary/</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="web">
          <source>Cancer Gene Trust</source>
          <access-date>2019-10-27</access-date>
          <comment>dapp<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cancergenetrust.org/docs/about">https://www.cancergenetrust.org/docs/about</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Glicksberg</surname>
              <given-names>BS</given-names>
            </name>
            <name name-style="western">
              <surname>Oskotsky</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Thangaraj</surname>
              <given-names>PM</given-names>
            </name>
            <name name-style="western">
              <surname>Giangreco</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Badgeley</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>KW</given-names>
            </name>
            <name name-style="western">
              <surname>Datta</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Rudrapatna</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Rappoport</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Shervey</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Miotto</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Goldstein</surname>
              <given-names>TC</given-names>
            </name>
            <name name-style="western">
              <surname>Rutenberg</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Frazier</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Israni</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Larsen</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Percha</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Dudley</surname>
              <given-names>JT</given-names>
            </name>
            <name name-style="western">
              <surname>Tatonetti</surname>
              <given-names>NP</given-names>
            </name>
            <name name-style="western">
              <surname>Butte</surname>
              <given-names>AJ</given-names>
            </name>
          </person-group>
          <article-title>PatientExploreR: an extensible application for dynamic visualization of patient clinical history from electronic health records in the OMOP common data model</article-title>
          <source>Bioinformatics</source>
          <year>2019</year>
          <month>11</month>
          <day>1</day>
          <volume>35</volume>
          <issue>21</issue>
          <fpage>4515</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31214700"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/btz409</pub-id>
          <pub-id pub-id-type="medline">31214700</pub-id>
          <pub-id pub-id-type="pii">5520433</pub-id>
          <pub-id pub-id-type="pmcid">PMC6821222</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Allaire</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>McPherson</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <source>CRAN - R Project</source>
          <year>2015</year>
          <access-date>2019-10-27</access-date>
          <comment>Shiny: web application framework for R<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cran.r-project.org/web/packages/shiny/index.html">https://cran.r-project.org/web/packages/shiny/index.html</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Perrier</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Meyer</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <source>CRAN - R Project</source>
          <year>2018</year>
          <access-date>2019-10-27</access-date>
          <comment>shinyWidgets: Custom Inputs Widgets for Shiny<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cran.r-project.org/web/packages/shinyWidgets/shinyWidgets.pdf">https://cran.r-project.org/web/packages/shinyWidgets/shinyWidgets.pdf</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Attali</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <source>CRAN - R Project</source>
          <year>2017</year>
          <access-date>2019-10-27</access-date>
          <comment>shinyjs: Easily Improve the User Experience of Your Shiny Apps in Seconds<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cran.r-project.org/web/packages/shinyjs/index.html">https://cran.r-project.org/web/packages/shinyjs/index.html</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Attali</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Edwards</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <source>CRAN - R Project</source>
          <year>2018</year>
          <access-date>2019-10-27</access-date>
          <comment>shinyalert: Easily Create Pretty Popup Messages (Modals) in 'Shiny'<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cran.r-project.org/web/packages/shinyalert/shinyalert.pdf">https://cran.r-project.org/web/packages/shinyalert/shinyalert.pdf</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sali</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <source>CRAN - R Project</source>
          <year>2017</year>
          <access-date>2019-10-27</access-date>
          <comment>shinycssloaders: Add CSS Loading Animations to 'shiny' Outputs<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cran.r-project.org/web/packages/shinycssloaders/index.html">https://cran.r-project.org/web/packages/shinycssloaders/index.html</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bailey</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <source>CRAN - R Project</source>
          <year>2015</year>
          <access-date>2019-10-27</access-date>
          <comment>shinyBS: Twitter Bootstrap Components for Shiny<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cran.r-project.org/web/packages/shinyBS/shinyBS.pdf">https://cran.r-project.org/web/packages/shinyBS/shinyBS.pdf</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <source>CRAN - R Project</source>
          <year>2015</year>
          <access-date>2019-10-27</access-date>
          <comment>shinythemes: Themes for Shiny<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cran.r-project.org/web/packages/shinythemes/index.html">https://cran.r-project.org/web/packages/shinythemes/index.html</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sievert</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Parmer</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hocking</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Chamberlain</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ram</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Corvellec</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <source>CRAN - R Project</source>
          <year>2017</year>
          <access-date>2019-10-27</access-date>
          <comment>plotly: Create Interactive Web Graphics via 'plotly.js'<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cran.r-project.org/web/packages/plotly/index.html">https://cran.r-project.org/web/packages/plotly/index.html</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Attali</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Almende</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <source>CRAN - R Project</source>
          <year>2016</year>
          <access-date>2019-10-27</access-date>
          <comment>timevis: Create Interactive Timeline Visualizations in R<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cran.r-project.org/web/packages/timevis/index.html">https://cran.r-project.org/web/packages/timevis/index.html</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Glicksberg</surname>
              <given-names>BS</given-names>
            </name>
            <name name-style="western">
              <surname>Oskotsky</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Giangreco</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Thangaraj</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Rudrapatna</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Datta</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Frazier</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Larsen</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Tatonetti</surname>
              <given-names>NP</given-names>
            </name>
            <name name-style="western">
              <surname>Butte</surname>
              <given-names>AJ</given-names>
            </name>
          </person-group>
          <article-title>ROMOP: a light-weight R package for interfacing with OMOP-formatted electronic health record data</article-title>
          <source>JAMIA Open</source>
          <year>2019</year>
          <month>04</month>
          <volume>2</volume>
          <issue>1</issue>
          <fpage>10</fpage>
          <lpage>4</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31633087"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamiaopen/ooy059</pub-id>
          <pub-id pub-id-type="medline">31633087</pub-id>
          <pub-id pub-id-type="pmcid">PMC6800657</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dowle</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Srinivasan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gorecki</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chirico</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Stetsenko</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Short</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <source>CRAN - R Project</source>
          <year>2018</year>
          <access-date>2019-10-27</access-date>
          <comment>data.table: Extension of 'data.frame'<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cran.r-project.org/web/packages/data.table/index.html">https://cran.r-project.org/web/packages/data.table/index.html</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Allaire</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Reavis</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Gersen</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Szopka</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <source>CRAN - R Project</source>
          <year>2016</year>
          <access-date>2019-10-27</access-date>
          <comment>DT: A Wrapper of the JavaScript Library 'DataTables'<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cran.r-project.org/web/packages/DT/index.html">https://cran.r-project.org/web/packages/DT/index.html</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Couture-Beil</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <source>CRAN - R Project</source>
          <year>2018</year>
          <access-date>2019-10-27</access-date>
          <comment>rjson: JSON for R<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cran.r-project.org/web/packages/rjson/rjson.pdf">https://cran.r-project.org/web/packages/rjson/rjson.pdf</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wickham</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Francois</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Henry</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Müller</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <source>CRAN - R Project</source>
          <year>2015</year>
          <access-date>2019-10-27</access-date>
          <comment>dplyr: A grammar of data manipulation<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cran.r-project.org/web/packages/dplyr/index.html">https://cran.r-project.org/web/packages/dplyr/index.html</ext-link>
                                                </comment>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="web">
          <source>PatientExploreR-CGT</source>
          <access-date>2019-10-27</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://patientexplorer.cancergenetrust.org">http://patientexplorer.cancergenetrust.org</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Pollard</surname>
              <given-names>TJ</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Lehman</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Feng</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ghassemi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Moody</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Szolovits</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Celi</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Mark</surname>
              <given-names>RG</given-names>
            </name>
          </person-group>
          <article-title>MIMIC-III, a freely accessible critical care database</article-title>
          <source>Sci Data</source>
          <year>2016</year>
          <month>05</month>
          <day>24</day>
          <volume>3</volume>
          <fpage>160035</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27219127"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/sdata.2016.35</pub-id>
          <pub-id pub-id-type="medline">27219127</pub-id>
          <pub-id pub-id-type="pii">sdata201635</pub-id>
          <pub-id pub-id-type="pmcid">PMC4878278</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hripcsak</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Shang</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Peissig</surname>
              <given-names>PL</given-names>
            </name>
            <name name-style="western">
              <surname>Rasmussen</surname>
              <given-names>LV</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Benoit</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Carroll</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Carrell</surname>
              <given-names>DS</given-names>
            </name>
            <name name-style="western">
              <surname>Denny</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Dikilitas</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Gainer</surname>
              <given-names>VS</given-names>
            </name>
            <name name-style="western">
              <surname>Howell</surname>
              <given-names>KM</given-names>
            </name>
            <name name-style="western">
              <surname>Klann</surname>
              <given-names>JG</given-names>
            </name>
            <name name-style="western">
              <surname>Kullo</surname>
              <given-names>IJ</given-names>
            </name>
            <name name-style="western">
              <surname>Lingren</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Mentch</surname>
              <given-names>FD</given-names>
            </name>
            <name name-style="western">
              <surname>Murphy</surname>
              <given-names>SN</given-names>
            </name>
            <name name-style="western">
              <surname>Natarajan</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Pacheco</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Wiley</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Facilitating phenotype transfer using a common data model</article-title>
          <source>J Biomed Inform</source>
          <year>2019</year>
          <month>08</month>
          <volume>96</volume>
          <fpage>103253</fpage>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2019.103253</pub-id>
          <pub-id pub-id-type="medline">31325501</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(19)30172-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC6697565</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Agniel</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kohane</surname>
              <given-names>IS</given-names>
            </name>
            <name name-style="western">
              <surname>Weber</surname>
              <given-names>GM</given-names>
            </name>
          </person-group>
          <article-title>Biases in electronic health record data due to processes within the healthcare system: retrospective observational study</article-title>
          <source>Br Med J</source>
          <year>2018</year>
          <month>04</month>
          <day>30</day>
          <volume>361</volume>
          <fpage>k1479</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.bmj.com/cgi/pmidlookup?view=long&#38;pmid=29712648"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmj.k1479</pub-id>
          <pub-id pub-id-type="medline">29712648</pub-id>
          <pub-id pub-id-type="pmcid">PMC5925441</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rocher</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Hendrickx</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>de Montjoye</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Estimating the success of re-identifications in incomplete datasets using generative models</article-title>
          <source>Nat Commun</source>
          <year>2019</year>
          <month>07</month>
          <day>23</day>
          <volume>10</volume>
          <issue>1</issue>
          <fpage>3069</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31337762"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41467-019-10933-3</pub-id>
          <pub-id pub-id-type="medline">31337762</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41467-019-10933-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC6650473</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
