<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<?covid-19-tdm?>
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v23i9e31122</article-id>
      <article-id pub-id-type="pmid">34543225</article-id>
      <article-id pub-id-type="doi">10.2196/31122</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Columbia Open Health Data for COVID-19 Research: Database Analysis</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Basch</surname>
            <given-names>Corey</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Estiri</surname>
            <given-names>Hossein</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Kruesi</surname>
            <given-names>Lisa</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Fecho</surname>
            <given-names>Karamarie</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Lee</surname>
            <given-names>Junghwan</given-names>
          </name>
          <degrees>MA</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-1240-7655</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Kim</surname>
            <given-names>Jae Hyun</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-8609-7135</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>Cong</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6024-3037</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Hripcsak</surname>
            <given-names>George</given-names>
          </name>
          <degrees>MD, MS</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2664-7614</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Natarajan</surname>
            <given-names>Karthik</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9066-9431</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Ta</surname>
            <given-names>Casey</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-4679-805X</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Weng</surname>
            <given-names>Chunhua</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Columbia University</institution>
            <addr-line>Ph-20, 622 W 168 ST</addr-line>
            <addr-line>New York, NY</addr-line>
            <country>United States</country>
            <phone>1 212 304 7907</phone>
            <email>cw2384@cumc.columbia.edu</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9624-0214</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Columbia University</institution>
        <addr-line>New York, NY</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Chunhua Weng <email>cw2384@cumc.columbia.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>9</month>
        <year>2021</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>30</day>
        <month>9</month>
        <year>2021</year>
      </pub-date>
      <volume>23</volume>
      <issue>9</issue>
      <elocation-id>e31122</elocation-id>
      <history>
        <date date-type="received">
          <day>11</day>
          <month>6</month>
          <year>2021</year>
        </date>
        <date date-type="rev-request">
          <day>21</day>
          <month>7</month>
          <year>2021</year>
        </date>
        <date date-type="rev-recd">
          <day>3</day>
          <month>8</month>
          <year>2021</year>
        </date>
        <date date-type="accepted">
          <day>3</day>
          <month>8</month>
          <year>2021</year>
        </date>
      </history>
      <copyright-statement>©Junghwan Lee, Jae Hyun Kim, Cong Liu, George Hripcsak, Karthik Natarajan, Casey Ta, Chunhua Weng. Originally published in the Journal of Medical Internet Research (https://www.jmir.org), 30.09.2021.</copyright-statement>
      <copyright-year>2021</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on https://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2021/9/e31122" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>COVID-19 has threatened the health of tens of millions of people all over the world. Massive research efforts have been made in response to the COVID-19 pandemic. Utilization of clinical data can accelerate these research efforts to combat the pandemic since important characteristics of the patients are often found by examining the clinical data. Publicly accessible clinical data on COVID-19, however, remain limited despite the immediate need.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>To provide shareable clinical data to catalyze COVID-19 research, we present Columbia Open Health Data for COVID-19 Research (COHD-COVID), a publicly accessible database providing clinical concept prevalence, clinical concept co-occurrence, and clinical symptom prevalence for hospitalized patients with COVID-19. COHD-COVID also provides data on hospitalized patients with influenza and general hospitalized patients as comparator cohorts.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>The data used in COHD-COVID were obtained from NewYork-Presbyterian/Columbia University Irving Medical Center’s electronic health records database. Condition, drug, and procedure concepts were obtained from the visits of identified patients from the cohorts. Rare concepts were excluded, and the true concept counts were perturbed using Poisson randomization to protect patient privacy. Concept prevalence, concept prevalence ratio, concept co-occurrence, and symptom prevalence were calculated using the obtained concepts.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Concept prevalence and concept prevalence ratio analyses showed the clinical characteristics of the COVID-19 cohorts, confirming the well-known characteristics of COVID-19 (eg, acute lower respiratory tract infection and cough). The concepts related to the well-known characteristics of COVID-19 recorded high prevalence and high prevalence ratio in the COVID-19 cohort compared to the hospitalized influenza cohort and general hospitalized cohort. Concept co-occurrence analyses showed potential associations between specific concepts. In case of acute lower respiratory tract infection in the COVID-19 cohort, a high co-occurrence ratio was obtained with COVID-19–related concepts and commonly used drugs (eg, disease due to coronavirus and acetaminophen). Symptom prevalence analysis indicated symptom-level characteristics of the cohorts and confirmed that well-known symptoms of COVID-19 (eg, fever, cough, and dyspnea) showed higher prevalence than the hospitalized influenza cohort and the general hospitalized cohort.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>We present COHD-COVID, a publicly accessible database providing useful clinical data for hospitalized patients with COVID-19, hospitalized patients with influenza, and general hospitalized patients. We expect COHD-COVID to provide researchers and clinicians quantitative measures of COVID-19–related clinical features to better understand and combat the pandemic.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>COVID-19</kwd>
        <kwd>open data</kwd>
        <kwd>electronic health record</kwd>
        <kwd>data science</kwd>
        <kwd>research</kwd>
        <kwd>data</kwd>
        <kwd>access</kwd>
        <kwd>database</kwd>
        <kwd>symptom</kwd>
        <kwd>cohort</kwd>
        <kwd>prevalence</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>COVID-19 has threatened the health of tens of millions of people all over the world. The global pandemic caused by COVID-19 has sparked massive research efforts in the fight against the novel disease, including characterizing the disease and clinical progression, identifying risk factors for hospitalization, and finding drugs that can be repurposed to lessen disease severity [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref3">3</xref>]. Utilization of clinical data from different institutions, hospitals, and nations can accelerate these research efforts since important characteristics of the patients are often found by examining the shared clinical data. Although many studies sharing epidemiological data [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref5">5</xref>], public health [<xref ref-type="bibr" rid="ref6">6</xref>], and social measures [<xref ref-type="bibr" rid="ref7">7</xref>] for COVID-19 research have been conducted, publicly accessible clinical data on COVID-19 remain limited despite the immediate need [<xref ref-type="bibr" rid="ref8">8</xref>], mainly owing to the potential risk to patient privacy that can still exist even after deidentification of the data [<xref ref-type="bibr" rid="ref9">9</xref>].</p>
      <p>Recognizing the need for publicly accessible electronic health record (EHR)–derived data in a broad range of clinical and translational research, we previously developed Columbia Open Health Data (COHD). COHD provides open and easy access to prevalence and co-occurrence statistics on conditions, drugs, procedures, and demographics derived from structured EHR data from NewYork-Presbyterian/Columbia University Irving Medical Center (NYP/CUIMC) [<xref ref-type="bibr" rid="ref10">10</xref>], which serves the large and diverse population of NYC and its surrounding areas. Since its deployment, COHD has accelerated biomedical research by providing 2 informative resources, prevalence and co-occurrence statistics, and their derived association metrics [<xref ref-type="bibr" rid="ref10">10</xref>-<xref ref-type="bibr" rid="ref12">12</xref>].</p>
      <p>NYC was one of the first epicenters of COVID-19 in the United States with the first confirmed case on February 29, 2020 [<xref ref-type="bibr" rid="ref13">13</xref>]. As one of the largest academic medical centers in NYC, NYP/CUIMC has admitted more than 4000 patients as of September 1, 2020. We aim to provide shareable clinical data to catalyze future COVID-19 research by presenting Columbia Open Health Data for COVID-19 Research (COHD-COVID), a publicly accessible database providing clinical concept prevalence, the clinical concept prevalence ratio between cohorts, clinical concept co-occurrence, and clinical symptom prevalence for a cohort of hospitalized patients with COVID-19 and comparator cohorts (a cohort of hospitalized patients with influenza and a general hospitalized patient cohort) derived from NYP/CUIMC’s electronic health records. In addition to providing publicly accessible data files via the Figshare data repository, we also developed the COHD-COVID web application programming interface (API) for easy access and better usability.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Methods Overview</title>
        <p>We used the term “concept” to refer to clinical entities and events such as conditions (ie, diagnosis), drugs, and procedures. The concepts and their names are defined by the Observational Medical Outcomes Partnership (OMOP) Common Data Model (CDM). When concepts are referenced in this paper, the name of the concept is styled in italics (eg, <italic>Disorder of respiratory system</italic>) to distinguish the formalized concepts from regular text. We also styled entities in the OMOP CDM (eg, <italic>person_id</italic> column in <italic>condition_occurrence</italic> table) in italics.</p>
        <p><xref rid="figure1" ref-type="fig">Figure 1</xref> depicts the overall workflow to create COHD-COVID. Columbia’s clinical data warehouse was converted to the OMOP CDM. We first filtered the EHR data in accordance with the cohort definitions, and then EHR for each patient’s inpatient visits were identified. Condition, drug, and procedure concepts were obtained from the identified visits. Concept prevalence, concept prevalence ratio, concept co-occurrence, and symptom prevalence analyses followed using the obtained concepts. To protect patient privacy, we excluded rare concepts observed in 10 or fewer visits and perturbed the true counts using Poisson randomization. Perturbation of the true counts and exclusion of rare concepts reduce the uniqueness of individual in the data, which can minimize the risk of reidentification [<xref ref-type="bibr" rid="ref9">9</xref>]. Perturbed counts generated by the Poisson randomization process do not show a significant difference from the true counts [<xref ref-type="bibr" rid="ref10">10</xref>]. The resulting data were stored in a MySQL database and made publicly available via the COHD-COVID web API [<xref ref-type="bibr" rid="ref14">14</xref>]. All analyses were conducted using Python 3.5.2. This study received institutional review board approval with a waiver for informed consent.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Overall workflow of Columbia Open Health Data for COVID-19 Research (COHD-COVID). API: application programming interface; NYP/CUIMC: NewYork-Presbyterian/Columbia University Irving Medical Center; OMOP CDM: Observational Medical Outcomes Partnership Common Data Model.</p>
          </caption>
          <graphic xlink:href="jmir_v23i9e31122_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Data Source</title>
        <p>We utilized EHR data from the NYP/CUIMC’s clinical data warehouse, where inpatient and outpatient data dating back to 1985 are stored. EHR data were collected during routine clinical care. Patients were notified of potential uses of their data for research at the point of care and data collection. NYP/CUIMC has converted its clinical data warehouse to OMOP CDM on a regular basis. Since NYP/CUIMC covers NYC and the surrounding area, which has a diverse population of 8.2 million people and was an early COVID-19 epicenter, the EHR data from NYP/CUIMC can provide a diverse and large sample of patients with COVID-19.</p>
        <p>Three different patient cohorts were used in this study. The COVID-19 cohort was defined as hospitalized patients aged ≥18 years with a COVID-19–related condition diagnosis or a confirmed positive COVID-19 test result during their hospitalization period or within the prior 21 days. Patients identified with the COVID-19 cohort definition from March 1, 2020, to September 1, 2020, were included in the COVID-19 cohort. The influenza cohort was similarly defined as patients aged ≥18 years who had at least 1 occurrence of influenza conditions or precoordinated positive measurements or positive influenza test results during their hospitalization period or within the prior 21 days. The general cohort was defined as all hospitalized patients aged ≥18 years. Patient visits from calendar years 2014 to 2019 were included for the influenza and general cohorts. All cohorts were divided into subcohorts stratified by sex (male vs female) and age (adults aged 18-64 years vs seniors aged &#62;65 years) for further investigation. The COVID-19 and influenza cohort definitions were adapted from the cohort definitions created by the Observational Health Data Science and Informatics’ (OHDSI’s) international network study for COVID-19 [<xref ref-type="bibr" rid="ref3">3</xref>]. Summary statistics of the cohorts are provided in <xref ref-type="table" rid="table1">Table 1</xref>.</p>
        <p>Patients belonging to the cohorts based on the 3 cohort definitions above were identified using the unique <italic>person_id</italic> from the <italic>person</italic> table in the OMOP CDM. Condition, drug, and procedure concepts observed in these patients during inpatient visits were extracted from the <italic>condition_occurrence</italic>, <italic>drug_exposure</italic>, and <italic>procedure_occurrence</italic> tables in the OMOP CDM, respectively. Inpatient visits of patients and the concepts in these visits were identified using <italic>person_id</italic> along with <italic>visit_occurrence_id</italic> from the <italic>visit_occurrence</italic> table. We used visit-based counts instead of patient-based counts in the following analyses for robust comparison between cohorts that had different observation windows. For example, if we use patient-based counts, the patients included in cohorts with longer observation windows are likely to be observed with more concepts than the patients in cohorts with shorter observation windows, which could inject bias into the metrics used in the analyses. Thus, we used visit-based counts to mitigate the effect of different observation window lengths to reduce the bias.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Basic statistics of 3 cohorts in the Columbia Open Health Data for COVID-19 Research database. The statistics summarized here are based on the data from NewYork-Presbyterian/Columbia University Irving Medical Center as of September 1, 2020.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="250"/>
            <col width="250"/>
            <col width="250"/>
            <col width="250"/>
            <thead>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>COVID-19 cohort</td>
                <td>Influenza cohort</td>
                <td>General cohort<break/>  <break/>  </td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Time range</td>
                <td>March 1, 2020, to August 31, 2020</td>
                <td>January 1, 2014, to December 12, 2019</td>
                <td>January 1, 2014, to December 12, 2019</td>
              </tr>
              <tr valign="top">
                <td>Patients, n</td>
                <td>4127</td>
                <td>3261</td>
                <td>175,930</td>
              </tr>
              <tr valign="top">
                <td>Total inpatient visits, n</td>
                <td>4846</td>
                <td>3860</td>
                <td>314,680</td>
              </tr>
              <tr valign="top">
                <td>Male patients; inpatient visits, n (%)</td>
                <td>2103 (51.0); 2518 (52.0)</td>
                <td>1454 (44.6); 1732 (44.9)</td>
                <td>67,662 (38.5); 128,908 (41.0)</td>
              </tr>
              <tr valign="top">
                <td>Female patients; inpatient visits, n (%)</td>
                <td>2024 (49.0); 2328 (48.0)</td>
                <td>1807 (55.4); 2128 (55.1)</td>
                <td>108,268 (61.5); 185,772 (59.0)</td>
              </tr>
              <tr valign="top">
                <td>Adult patients (aged 18-64 years); inpatient visits, n (%)</td>
                <td>2147 (52.0); 2511 (51.8)</td>
                <td>1315 (40.3); 1553 (40.2)</td>
                <td>104,020 (59.1); 173,843 (55.2)</td>
              </tr>
              <tr valign="top">
                <td>Senior patients (&#62;65 years); inpatient visits, n (%)</td>
                <td>1980 (48.0); 2335 (48.2)</td>
                <td>1946 (59.7); 2307 (59.8)</td>
                <td>71,910 (40.9); 140,837 (44.8)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Concept Prevalence and Concept Prevalence Ratio Analysis</title>
        <p>We calculated the concept prevalence in each cohort as detected from the EHR. The concept prevalence is defined as in equation <bold>(1)</bold>.</p>
        <disp-formula>
          <graphic xlink:href="jmir_v23i9e31122_fig8.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </disp-formula>
        <p>where <inline-graphic xlink:href="jmir_v23i9e31122_fig9.png" xlink:type="simple" mimetype="image"/> is the prevalence of concept <italic>C</italic> in cohort <italic>H</italic>, <inline-graphic xlink:href="jmir_v23i9e31122_fig10.png" xlink:type="simple" mimetype="image"/> is the set of unique inpatient visits of patients in cohort <italic>H</italic> observed with concept <italic>C</italic>, and <italic>T<sub>H</sub></italic> is the set of unique inpatient visits of patients in cohort <italic>H.</italic> We also calculated hierarchical concept prevalence by defining <inline-graphic xlink:href="jmir_v23i9e31122_fig10.png" xlink:type="simple" mimetype="image"/> as the set of unique visits of patients observed with concept <italic>C</italic> or any of concept <italic>C</italic>’s descendant concepts as defined in the <italic>concept_ancestor</italic> table in the OMOP CDM. For example, the hierarchical count for <italic>Ibuprofen</italic> (OMOP concept ID 1177480) not only includes entries where the specific concept <italic>Ibuprofen</italic> was used, but also includes entries using other descendant concepts, such as <italic>Ibuprofen 600 MG Oral Tablet</italic> (OMOP concept ID 19019073). Taking hierarchical relationships into account mitigates some of the issues with coding variations across time and practices as different concepts with minor semantic differences can be aggregated into higher-level concepts.</p>
        <p>The concept prevalence ratio indicates how frequently concept <italic>C</italic> occurs in cohort <italic>A</italic> relative to cohort <italic>B</italic>. The natural logarithm of the concept prevalence ratio is defined as in equation <bold>(2)</bold>.</p>
        <disp-formula>
          <graphic xlink:href="jmir_v23i9e31122_fig11.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </disp-formula>
        <p>where <italic>LR</italic>(<italic>C<sub>A,B</sub></italic>) is the log ratio of the prevalence of concept <italic>C</italic> for cohort <italic>A</italic> to cohort <italic>B</italic>, <inline-graphic xlink:href="jmir_v23i9e31122_fig12.png" xlink:type="simple" mimetype="image"/> is prevalence of concept <italic>C</italic> in cohort <italic>A</italic>, and <inline-graphic xlink:href="jmir_v23i9e31122_fig13.png" xlink:type="simple" mimetype="image"/> is prevalence of concept <italic>C</italic> in cohort <italic>B</italic>. Hierarchical concept prevalence ratio can be calculated by using hierarchical concept prevalence <inline-graphic xlink:href="jmir_v23i9e31122_fig12.png" xlink:type="simple" mimetype="image"/> and <inline-graphic xlink:href="jmir_v23i9e31122_fig13.png" xlink:type="simple" mimetype="image"/>.</p>
      </sec>
      <sec>
        <title>Concept Co-occurrence Analysis</title>
        <p>Concept co-occurrence represents how frequently a specific concept pair appears in a cohort. We defined concept co-occurrence prevalence as in equation <bold>(3)</bold>.</p>
        <disp-formula>
          <graphic xlink:href="jmir_v23i9e31122_fig14.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </disp-formula>
        <p>where <inline-graphic xlink:href="jmir_v23i9e31122_fig15.png" xlink:type="simple" mimetype="image"/> is the co-occurrence prevalence of concepts <italic>C<sub>1</sub></italic> and <italic>C<sub>2</sub></italic> in cohort <italic>H</italic>, <inline-graphic xlink:href="jmir_v23i9e31122_fig16.png" xlink:type="simple" mimetype="image"/> is the set of unique visits of patients observed with concept <italic>C<sub>1</sub></italic> and <italic>C<sub>2</sub></italic> in cohort <italic>H</italic>, and <italic>T<sub>H</sub></italic> is the set of unique visits of patients in the cohort <italic>H</italic>. We also calculated hierarchical concept co-occurrence using the hierarchy of concepts as described above.</p>
      </sec>
      <sec>
        <title>COVID-19 Symptom Prevalence Analysis</title>
        <p>Since clinical symptoms often include multiple granular clinical concepts, a set of related concepts for a symptom is required to calculate the prevalence of the symptom. For example, dyspnea, which is one of the major symptoms of COVID-19, can be detected as standard concept <italic>Dyspnea</italic> or <italic>Acute respiratory distress</italic> in different patients. The 2 concepts do not have any hierarchical relationship and thus will not be aggregated by the hierarchical prevalence analyses. Thus, a concept set containing both <italic>Dyspnea</italic> and <italic>Acute respiratory distress</italic> is needed for accurate calculation of the prevalence of dyspnea. We defined symptom prevalence as in equation <bold>(4)</bold>.</p>
        <disp-formula>
          <graphic xlink:href="jmir_v23i9e31122_fig17.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </disp-formula>
        <p>where <inline-graphic xlink:href="jmir_v23i9e31122_fig18.png" xlink:type="simple" mimetype="image"/> is prevalence of symptom <italic>S</italic> in cohort <italic>H</italic>, <inline-graphic xlink:href="jmir_v23i9e31122_fig19.png" xlink:type="simple" mimetype="image"/> is the set of unique visits of patients observed with concept <italic>C<sub>i</sub></italic>, <italic>T<sub>H</sub></italic> is the set of unique visits of patients observed in the cohort <italic>H</italic>, <italic>s</italic> is the number of the unique concepts in the concept set for symptom <italic>S</italic>, and ∪ is the union operator. Hierarchy between concepts is not considered in the symptom prevalence analysis since a concept set of a symptom already reflects hierarchy for that symptom.</p>
        <p>We used concept sets for 11 major symptoms of COVID-19 (<italic>Cough</italic>, <italic>Chills</italic>, <italic>Abdominal pain</italic>, <italic>Diarrhea</italic>, <italic>Dyspnea</italic>, <italic>Fatigue</italic>, <italic>Fever</italic>, <italic>Myalgia</italic>, <italic>Nausea and vomiting</italic>, <italic>Tachypnea</italic>, and <italic>Throat pain</italic>), which have been defined by OHDSI to calculate symptom prevalence. The concepts included in each symptom are available in Figshare [<xref ref-type="bibr" rid="ref15">15</xref>].</p>
      </sec>
      <sec>
        <title>Data Quality Analysis</title>
        <p>Assessing the quality of EHR data is critical for its effects on secondary analysis for research in the health care and medical domains [<xref ref-type="bibr" rid="ref16">16</xref>]. We calculated the sum of nonrandomized counts of all concepts on a monthly basis for the COVID-19 cohort and on a yearly basis for the general and influenza cohorts. For each of the condition, drug, and procedure domains, we examined the total counts of concepts with the number of visits to detect any issues regarding data quality and temporal plausibility of the EHR data we used in the study [<xref ref-type="bibr" rid="ref17">17</xref>]. We also calculated the annual mean (SD) values of concept prevalence and concept co-occurrence for the general and influenza cohorts to assess the temporal variance of each concept and concept co-occurrence pair.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Results Overview</title>
        <p>In this section, we show a sample of the results of analyses using the data from COHD-COVID. Since COHD-COVID contains massive amounts of data covering several thousand concepts, it is worth noting that only a small sample of the results is shown in this section. Users can obtain the results of interest in addition to the results shown in this section by using the COHD-COVID API [<xref ref-type="bibr" rid="ref14">14</xref>] or by downloading the flat data files from Figshare [<xref ref-type="bibr" rid="ref15">15</xref>]. The results of all analyses, concept definitions, and concepts included in each symptom are available as tab-delimited flat files in Figshare, except the concept prevalence ratio analyses, since they can be directly computed from concept prevalence data. COHD-COVID API [<xref ref-type="bibr" rid="ref14">14</xref>] provides all results.</p>
      </sec>
      <sec>
        <title>Concept Prevalence Analysis</title>
        <p><xref rid="figure2" ref-type="fig">Figure 2</xref> shows the prevalence of 10 condition (<xref rid="figure2" ref-type="fig">Figure 2</xref>A) and drug concepts (<xref rid="figure2" ref-type="fig">Figure 2</xref>B) in the COVID-19 cohort, influenza cohort, and general cohort. We chose the 10 most prevalent condition and drug concepts in the COVID-19 cohort for this use case. For drug concepts, we chose the most prevalent drug ingredient concepts using hierarchical analysis to count multiple drugs that have different brand names, dosages, and formulations but are based on the same ingredients together. The condition concepts were chosen without hierarchical analysis to identify the top 10 specific conditions. <italic>Fever</italic> showed the highest prevalence (0.2619) among all condition concepts for the COVID-19 cohort, followed by <italic>Cough</italic> (0.2491) and <italic>Dyspnea</italic> (0.2594). <italic>Acetaminophen</italic> was the most prevalent (0.7912) drug ingredient used for patients with COVID-19, followed by <italic>Enoxaparin</italic> (0.5803) and <italic>Glucose</italic> (0.4424). <xref rid="figure3" ref-type="fig">Figures 3</xref> and <xref rid="figure4" ref-type="fig">4</xref> show the prevalence of 10 condition and drug concepts, respectively, in the COVID-19 cohort stratified by age (<xref rid="figure3" ref-type="fig">Figures 3</xref>A and 4A) and gender (<xref rid="figure4" ref-type="fig">Figure 4</xref>A and 4B). The 10 condition and drug concepts were the top 10 most prevalent concepts in the full COVID-19 cohort without stratification.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>(A) Condition and (B) drug concept prevalence in the COVID-19 cohort, influenza cohort, and general cohort.</p>
          </caption>
          <graphic xlink:href="jmir_v23i9e31122_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Condition concept prevalence in (A) age and (B) sex sub-cohorts of the COVID-19 cohort. The full COVID-19 cohort indicates original COVID-19 cohort without stratification.</p>
          </caption>
          <graphic xlink:href="jmir_v23i9e31122_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Drug concept prevalence in (A) age and (B) sex subcohorts of the COVID-19 cohort. The full COVID-19 cohort indicates original COVID-19 cohort without stratification.</p>
          </caption>
          <graphic xlink:href="jmir_v23i9e31122_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Concept Prevalence Ratio Analysis</title>
        <p><xref ref-type="table" rid="table2">Table 2</xref> shows the top 10 condition concepts that showed the highest concept prevalence ratio for the COVID-19 cohort relative to the comparator cohorts (general cohort and influenza cohort). <italic>Disease due to Coronavirus</italic> and <italic>Acute lower respiratory tract infection</italic> showed the highest concept prevalence ratio for the COVID-19 cohort relative to the influenza cohort and the general cohort, respectively.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Top 10 condition concepts that show the highest concept prevalence ratio for the COVID-19 cohort relative to the general and influenza cohorts.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="500"/>
            <col width="500"/>
            <thead>
              <tr valign="top">
                <td>Influenza cohort (prevalence ratio)</td>
                <td>General cohort (prevalence ratio)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Disease due to Coronavirus (3.28)</td>
                <td>Acute lower respiratory tract infection (7.30)</td>
              </tr>
              <tr valign="top">
                <td>Disorientated (2.44)</td>
                <td>Disorder of respiratory system (5.56)</td>
              </tr>
              <tr valign="top">
                <td>Blood chemistry abnormal (2.25)</td>
                <td>General finding of observation of patient (5.17)</td>
              </tr>
              <tr valign="top">
                <td>Acute respiratory distress syndrome (2.16)</td>
                <td>Outcome of delivery – finding (5.13)</td>
              </tr>
              <tr valign="top">
                <td>Cerebral infarction (1.84)</td>
                <td>Chest pain on breathing (5.09)</td>
              </tr>
              <tr valign="top">
                <td>Cough (1.81)</td>
                <td>Disease due to Coronavirus (4.95)</td>
              </tr>
              <tr valign="top">
                <td>Viral pneumonia (1.61)</td>
                <td>Patient status finding (4.60)</td>
              </tr>
              <tr valign="top">
                <td>Acute respiratory distress (1.52)</td>
                <td>Unplanned pregnancy (4.23)</td>
              </tr>
              <tr valign="top">
                <td>Heart disease (1.32)</td>
                <td>Acute respiratory distress syndrome (4.17)</td>
              </tr>
              <tr valign="top">
                <td>Delivery normal (1.28)</td>
                <td>Deliveries by cesarean (3.98)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Concept Co-occurrence Analysis</title>
        <p><xref ref-type="table" rid="table3">Table 3</xref> shows the top 10 most frequently co-occurring concepts with <italic>Acute lower respiratory tract infection</italic> in the COVID-19 cohort. <italic>Acute lower respiratory tract infection</italic> was chosen among the 10 most prevalent condition concepts in the COVID-19 cohort. We used nonhierarchical concept co-occurrence to obtain the result.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>The 10 concepts that most frequently co-occurred with Acute lower respiratory tract infection in the full COVID-19 cohort.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="770"/>
            <col width="230"/>
            <thead>
              <tr valign="top">
                <td>Concept name</td>
                <td>Co-occurrence prevalence</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Disease due to Coronavirus</td>
                <td>0.2329</td>
              </tr>
              <tr valign="top">
                <td>Radiologic examination, chest; single view</td>
                <td>0.2214</td>
              </tr>
              <tr valign="top">
                <td>Infectious agent detection by nucleic acid (DNA or RNA); severe acute respiratory syndrome coronavirus 2</td>
                <td>0.2205</td>
              </tr>
              <tr valign="top">
                <td>Acetaminophen 325 MG Oral Tablet</td>
                <td>0.2037</td>
              </tr>
              <tr valign="top">
                <td>0.4 ML Enoxaparin sodium 100 MG/ML Prefilled Syringe</td>
                <td>0.1504</td>
              </tr>
              <tr valign="top">
                <td>Hydroxychloroquine Sulfate 200 MG Oral Tablet</td>
                <td>0.1246</td>
              </tr>
              <tr valign="top">
                <td>50 ML Glucose 500 MG/ML Prefilled Syringe</td>
                <td>0.1085</td>
              </tr>
              <tr valign="top">
                <td>Ceftriaxone 1000 MG Injection</td>
                <td>0.1073</td>
              </tr>
              <tr valign="top">
                <td>Blood typing, serologic; ABO</td>
                <td>0.1044</td>
              </tr>
              <tr valign="top">
                <td>Glucose 0.4 MG/MG Oral Gel</td>
                <td>0.0970</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>COVID-19 Symptom Prevalence Analysis</title>
        <p><xref rid="figure5" ref-type="fig">Figure 5</xref> shows the prevalence of the 11 major COVID-19 symptoms for all 3 cohorts. In the COVID-19 cohort, <italic>Dyspnea</italic> showed the highest prevalence among the 11 symptoms followed by <italic>Fever</italic> and <italic>Cough</italic>.</p>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>Symptom prevalence of 11 major symptoms in patients with COVID-19 for all 3 cohorts.</p>
          </caption>
          <graphic xlink:href="jmir_v23i9e31122_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Data Quality Analysis</title>
        <p><xref rid="figure6" ref-type="fig">Figure 6</xref> shows the total counts across all concepts in the condition domain (<xref rid="figure6" ref-type="fig">Figure 6</xref>A), drug domain (<xref rid="figure6" ref-type="fig">Figure 6</xref>B), procedure domain (<xref rid="figure6" ref-type="fig">Figure 6</xref>C), and the total visits per month between March 2020 and August 2020 (<xref rid="figure6" ref-type="fig">Figure 6</xref>D) for the COVID-19 cohort. The total counts of conditions, drugs, procedures, and total visits all show steep increases in March and April 2020, when the number of COVID-19 cases surged in NYC (<xref rid="figure6" ref-type="fig">Figure 6</xref>E) [<xref ref-type="bibr" rid="ref18">18</xref>]. The total counts of all domains and the total visits decreased starting May 2020 as the number of patients with COVID-19 in NYC decreased.</p>
        <p><xref rid="figure7" ref-type="fig">Figure 7</xref> shows the total counts per year across all concepts in the condition domain (<xref rid="figure7" ref-type="fig">Figure 7</xref>A), drug domain (<xref rid="figure7" ref-type="fig">Figure 7</xref>B), procedure domain (<xref rid="figure7" ref-type="fig">Figure 7</xref>C), and the total visits per year between 2014 and 2019 (<xref rid="figure7" ref-type="fig">Figure 7</xref>D) for the general cohort and influenza cohort. The total counts of conditions, drugs, procedures, and total visits per year for the 2 cohorts show consistent trends.</p>
        <p>The annual mean (SD) value of concept prevalence and concept co-occurrence for the general and influenza cohorts are available in Figshare [<xref ref-type="bibr" rid="ref15">15</xref>] to assess the temporal variance of each concept and concept co-occurrence pair. The mean and standard deviation of annual concept prevalence and co-occurrence should only be compared to each other to assess the stability of the concept over the given time period of the data set.</p>
        <p>A change in the EHR system can affect the quality and characteristics of EHR data collected for secondary research. NYP/CUIMC changed its EHR system as of February 1, 2020, from Allscripts to Epic, which might affect the COVID-19 cohort data and its characteristics as opposed to the influenza and general cohorts, which were collected prior to the EHR change. To detect the impact of the change, we performed a <italic>t</italic> test for all concepts reported in the COVID-19 cohort between the counts from a pre-Epic period (January 1, 2020, to January 31, 2020) and from a post-Epic period (February 1, 2020, to February 29, 2020). The post-Epic period was chosen to minimize the inclusion of dates when COVID-19 would have impacted clinical practices in NYC. The counts of concepts were recorded on a daily basis. We considered that there would be no difference between the 2 periods if the counts for the concept from the 2 periods are the same (ie, all 0 counts for the 2 periods). Of all 1066 unique concepts reported in the COVID-19 cohort, 119 (11.2%) concepts showed a significant difference (<italic>P</italic>≤.01) between the pre- and post-Epic periods. The <italic>P</italic> values of the <italic>t</italic> tests for all individual concepts are available in Figshare [<xref ref-type="bibr" rid="ref15">15</xref>] to allow users to factor in these data quality considerations for each concept.</p>
        <fig id="figure6" position="float">
          <label>Figure 6</label>
          <caption>
            <p>Total counts across all concepts in the (A) condition domain, (B) drug domain, (C) procedure domain, and (D) the total visits per month between March 2020 and August 2020 for the COVID-19 cohort. (E) Total COVID-19–positive cases per day in New York City from March 2020 to August 2020.</p>
          </caption>
          <graphic xlink:href="jmir_v23i9e31122_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure7" position="float">
          <label>Figure 7</label>
          <caption>
            <p>Total counts across all concepts in the (A) condition domain, (B) drug domain, (C) procedure domain, and (D) the total visits per year between 2014 and 2019 for the general and influenza cohort.</p>
          </caption>
          <graphic xlink:href="jmir_v23i9e31122_fig7.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>In this study, we present a publicly accessible database providing clinical concept prevalence, clinical concept co-occurrence, and clinical symptom prevalence for hospitalized patients with COVID-19, hospitalized patients with influenza, and general hospitalized patients. We showed the utility of the data for future data-driven studies by exploring the results of the concept prevalence analysis, concept prevalence ratio analysis, concept co-occurrence analysis, and symptom prevalence analysis. Results from the analyses aligned with published findings and can be used to find novel hypotheses as described in the following discussion. The results of all analyses were provided as flat files in Figshare [<xref ref-type="bibr" rid="ref15">15</xref>] and also easily accessible through web API [<xref ref-type="bibr" rid="ref14">14</xref>].</p>
        <p>Concept prevalence analysis on the 3 cohorts can be used to determine the clinical characteristics of the COVID-19 cohort. A comparison of the prevalence of these concepts between the COVID-19 cohort and the influenza or general cohorts provides contextual evidence regarding whether the concept is associated with COVID-19 or if it is common among hospitalized patients. <xref rid="figure2" ref-type="fig">Figure 2</xref>A shows that <italic>Fever</italic>, <italic>Cough</italic>, <italic>Dyspnea</italic>, and <italic>Acute lower respiratory syndrome</italic> were more highly prevalent in the COVID-19 cohort than in the 2 comparator cohorts. The concepts highly prevalent in the COVID-19 cohort were well-known symptoms of COVID-19, concurrent with existing studies. As shown in <xref rid="figure2" ref-type="fig">Figure 2</xref>B, <italic>Hydroxychloriquine</italic>, which was one of the drugs widely administered to patients with COVID-19 [<xref ref-type="bibr" rid="ref19">19</xref>] during the early months of the pandemic, showed high prevalence in the COVID-19 cohort.</p>
        <p>Concept prevalence analysis on the COVID-19 cohort and its subcohorts can be used to determine the clinical characteristics of the subcohorts and determine if these characters differ between the sexes or between adult and older patients. <xref rid="figure3" ref-type="fig">Figure 3</xref>A shows that the senior cohort had higher prevalences in all 10 condition concepts than the full and adult cohorts and also shows that <italic>Essential hypertension</italic> and <italic>Hypoxemia</italic> were particularly more prevalent in senior patients with COVID-19, which indicates that senior patients are more likely to have these apparent symptoms of COVID-19 than adult patients. <xref rid="figure4" ref-type="fig">Figure 4</xref>A shows that drug ingredients related to type 2 diabetes (eg, <italic>Glucose</italic> and <italic>Insulin Lispro</italic>) showed higher prevalence in senior patients than in adult patients, which indicates that type 2 diabetes is a more common comorbidity among senior patients with COVID-19.</p>
        <p>Concept prevalence ratio analysis can be used to unveil how often specific concepts appeared in the COVID-19 cohort compared to the comparator cohorts. <xref ref-type="table" rid="table2">Table 2</xref> shows that common and general symptoms of COVID-19 (eg, <italic>Chest pain on breathing</italic>, <italic>Cough</italic>, and <italic>Disease due to coronavirus</italic>) showed a high prevalence ratio in the COVID-19 cohort relative to the general cohort. In contrast, more severe symptoms of COVID-19 (eg, <italic>Disoriented</italic>, <italic>Acute respiratory distress syndrome</italic>, <italic>Viral pneumonia</italic>, and <italic>Blood chemistry abnormal</italic>) showed a higher prevalence ratio in the COVID-19 cohort than in the influenza cohort. Since both cohorts include hospitalized patients, these results may indicate that the aforementioned conditions are more strongly associated with the SARS-CoV-2 infection than with influenza. We also observed high prevalence ratios in concepts related to delivery in the COVID-19 cohort relative to the general cohort. Regrading <italic>Outcome of delivery – finding</italic>; for example, we observed a visit prevalence rate of 1.18% in the COVID-19 cohort, but only 0.0070% in the general cohort, yielding a prevalence ratio of 5.13. During normal times, deliveries only account for a small fraction of all inpatient visits. However, during the pandemic, there was a dramatic decrease in elective surgeries and hospitalizations besides those related to COVID-19 since hospital capacity was diverted their focus toward patients with COVID-19. In contrast, patients going into labor cannot be rescheduled and were regularly tested for SARS-CoV-2, which increased their representation within the COVID-19 cohort.</p>
        <p>Potential associations between specific concepts of interest can be found through co-occurrence analysis. For instance, <xref ref-type="table" rid="table3">Table 3</xref> confirms that the concepts associated with SARS-CoV-2 tests (ie, <italic>Disease due to Coronavirus</italic>, <italic>Radiologic examination, chest; single view</italic>, and <italic>Infectious agent detection by nucleic acid [DNA or RNA]; severe acute respiratory syndrome coronavirus 2</italic>) showed high co-occurrence prevalence with <italic>Acute lower respiratory tract infection</italic>, which shows natural strong associations between testing concepts for COVID-19 and one of the most prevalent concepts in the COVID-19 cohort.</p>
        <p>Symptom prevalence analysis can be used to examine symptom-level characteristics of the cohorts. The COVID-19 cohort showed higher prevalence in dyspnea, fever, and cough symptoms than the other 2 comparator cohorts, which is concurrent with the known characteristics and symptoms of COVID-19 [<xref ref-type="bibr" rid="ref20">20</xref>]. In contrast, a few of the known COVID-19 symptoms (eg, myalgia, throat pain, and chills) did now show high prevalence in the COVID-19 cohort, which might indicate that those symptoms are not clinically distinctively prevalent in patients with COVID-19.</p>
        <p>Most of the results from the analyses align with those of existing studies, thus empirically validating the utility of COHD-COVID. COHD-COVID also can be used to find novel hypotheses related COVID-19. COHD-COVID can be used as cross-institutional data to validate or support other COVID-19 studies. For instance, the high prevalence ratio of <italic>Cerebral infarction</italic> in the COVID-19 cohort compared to that in the influenza cohort (<xref ref-type="table" rid="table2">Table 2</xref>) corroborates with reports from a few studies that SARS-CoV-2 might be more likely to cause thrombotic vascular events, including stroke, than other coronavirus and seasonal infectious diseases [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref22">22</xref>].</p>
        <p>While we admit that the aggregated concept-level analyses may not be suitable to answer some clinical research questions, COHD-COVID will be useful for hypothesis generation and for validating emerging newly published findings on COVID-19 using real-world data. COHD, the precedent study of COHD-COVID, has been integrated into the National Center for Advancing Translational Sciences Biomedical Data Translator program, where the EHR-based data associations from COHD are linked to other sources of knowledge via knowledge graphs, allowing automated algorithms to perform reasoning on these knowledge graphs to answer biomedical questions and suggest novel hypotheses [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>].</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>There are several limitations to this study, which should be noted. One of the limitations is that analyses performed in this study can be affected by the factors included in the data acquisition process (eg, change in the EHR system, human biases, and errors during entry). For example, coding trends and patterns (ie, the trend and pattern of frequently used concepts) can be changed through a shift in system. Another limitation is that multiple visits from the same patient can be used to calculate the metrics in the analyses since we used visit-based counts instead of patient-based counts for the analyses. This could affect the results of the specific concepts appearing in patients who are hospitalized more frequently. We also admit that some of results from the analyses cannot be validated by existing or up-to-date findings, considering rapidly growing and changing knowledge related to COVID-19. Thus, it is desirable to conduct a literature search before utilizing the data and results. We will update the data and results on a regular basis to further alleviate this limitation.</p>
        <p>The EHR data used in this study were obtained from a single site: NYP/CUIMC. Even though NYP/CUIMC is a large academic medical center whose services cover the city and its surrounding areas, we admit that performing the analyses on the basis of the EHR data across multiple institutions and nations will be beneficial since multiple sites can diversify the population, improve accuracy, increase power and sensitivity to rare conditions, validate results by comparing across sites, and reduce variance that might exist in specific locations. Since the OMOP CDM provides the fundamentals to perform the same analyses on clinical data across different sites, we hope to collaborate with future studies sharing clinical characteristics of patients with COVID-19 and to generate a larger, richer, and more robust database that can be leveraged in translational research on COVID-19.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>In this study, we present COHD-COVID, a publicly accessible database providing useful clinical data for hospitalized patients with COVID-19, hospitalized patients with influenza, and general hospitalized patients. The analyses using the data from COHD-COVID confirmed the well-known clinical characteristics of patients with COVID-19 and can also be used to find novel hypotheses related to COVID-19. We expect COHD-COVID will provide researchers and clinicians quantitative measures of COVID-19–related clinical features to better understand and combat the pandemic.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">API</term>
          <def>
            <p>application programming interface</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">COHD</term>
          <def>
            <p>Columbia Open Health Data</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">COHD-COVID</term>
          <def>
            <p>Columbia Open Health Data for COVID-19 Research</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">EHR</term>
          <def>
            <p>Electronic health records</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">NYP/CUIMC</term>
          <def>
            <p>NewYork-Presbyterian/Columbia University Irving Medical Center</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">OHDSI</term>
          <def>
            <p>Observational Health Data Science and Informatics</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">OMOP CDM</term>
          <def>
            <p>Observational Medical Outcomes Partnership Common Data Model</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This study was supported by National Library of Medicine grant R01LM012895-03S1 and National Center for Advancing Translational Science grant 1OT2TR003434-01.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Du</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Fan</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Xiang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Song</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Gu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Guan</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Cao</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Clinical course and risk factors for mortality of adult inpatients with COVID-19 in Wuhan, China: a retrospective cohort study</article-title>
          <source>Lancet</source>
          <year>2020</year>
          <month>03</month>
          <day>28</day>
          <volume>395</volume>
          <issue>10229</issue>
          <fpage>1054</fpage>
          <lpage>1062</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32171076"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S0140-6736(20)30566-3</pub-id>
          <pub-id pub-id-type="medline">32171076</pub-id>
          <pub-id pub-id-type="pii">S0140-6736(20)30566-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC7270627</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Modi</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Sagar</surname>
              <given-names>SR</given-names>
            </name>
          </person-group>
          <article-title>In silico studies on therapeutic agents for COVID-19: Drug repurposing approach</article-title>
          <source>Life Sci</source>
          <year>2020</year>
          <month>07</month>
          <day>01</day>
          <volume>252</volume>
          <fpage>117652</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32278693"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.lfs.2020.117652</pub-id>
          <pub-id pub-id-type="medline">32278693</pub-id>
          <pub-id pub-id-type="pii">S0024-3205(20)30400-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC7194845</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Burn</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>You</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Sena</surname>
              <given-names>AG</given-names>
            </name>
            <name name-style="western">
              <surname>Kostka</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Abedtash</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Abrahão</surname>
              <given-names>MTF</given-names>
            </name>
            <name name-style="western">
              <surname>Alberga</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Alghoul</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Alser</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Alshammari</surname>
              <given-names>TM</given-names>
            </name>
            <name name-style="western">
              <surname>Aragon</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Areia</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Banda</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Cho</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Culhane</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Davydov</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>DeFalco</surname>
              <given-names>FJ</given-names>
            </name>
            <name name-style="western">
              <surname>Duarte-Salles</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>DuVall</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Falconer</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Fernandez-Bertolin</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Golozar</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hardin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hripcsak</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Huser</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Jeon</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Jing</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Jung</surname>
              <given-names>CY</given-names>
            </name>
            <name name-style="western">
              <surname>Kaas-Hansen</surname>
              <given-names>BS</given-names>
            </name>
            <name name-style="western">
              <surname>Kaduk</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kent</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Kolovos</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lane</surname>
              <given-names>JCE</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Lynch</surname>
              <given-names>KE</given-names>
            </name>
            <name name-style="western">
              <surname>Makadia</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Matheny</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Mehta</surname>
              <given-names>PP</given-names>
            </name>
            <name name-style="western">
              <surname>Morales</surname>
              <given-names>DR</given-names>
            </name>
            <name name-style="western">
              <surname>Natarajan</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Nyberg</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Ostropolets</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>RW</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Posada</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Prats-Uribe</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rao</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Reich</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Rho</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Rijnbeek</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Schilling</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Schuemie</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>NH</given-names>
            </name>
            <name name-style="western">
              <surname>Shoaibi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Song</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Spotnitz</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Suchard</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Swerdel</surname>
              <given-names>JN</given-names>
            </name>
            <name name-style="western">
              <surname>Vizcaya</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Volpe</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wen</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Yimer</surname>
              <given-names>BB</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Zhuk</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Prieto-Alhambra</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ryan</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Deep phenotyping of 34,128 adult patients hospitalised with COVID-19 in an international network study</article-title>
          <source>Nat Commun</source>
          <year>2020</year>
          <month>10</month>
          <day>06</day>
          <volume>11</volume>
          <issue>1</issue>
          <fpage>5009</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41467-020-18849-z"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41467-020-18849-z</pub-id>
          <pub-id pub-id-type="medline">33024121</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41467-020-18849-z</pub-id>
          <pub-id pub-id-type="pmcid">PMC7538555</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Gutierrez</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Mekaru</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sewalk</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Goodwin</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Loskill</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cohn</surname>
              <given-names>EL</given-names>
            </name>
            <name name-style="western">
              <surname>Hswen</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Hill</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Cobo</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Zarebski</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hulland</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Morgan</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>O'Brien</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Scarpino</surname>
              <given-names>SV</given-names>
            </name>
            <name name-style="western">
              <surname>Brownstein</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Pybus</surname>
              <given-names>OG</given-names>
            </name>
            <name name-style="western">
              <surname>Pigott</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Kraemer</surname>
              <given-names>MUG</given-names>
            </name>
          </person-group>
          <article-title>Epidemiological data from the COVID-19 outbreak, real-time case information</article-title>
          <source>Sci Data</source>
          <year>2020</year>
          <month>03</month>
          <day>24</day>
          <volume>7</volume>
          <issue>1</issue>
          <fpage>106</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41597-020-0448-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41597-020-0448-0</pub-id>
          <pub-id pub-id-type="medline">32210236</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41597-020-0448-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC7093412</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hasell</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Mathieu</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Beltekian</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Macdonald</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Giattino</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Ortiz-Ospina</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Roser</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ritchie</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>A cross-country database of COVID-19 testing</article-title>
          <source>Sci Data</source>
          <year>2020</year>
          <month>10</month>
          <day>08</day>
          <volume>7</volume>
          <issue>1</issue>
          <fpage>345</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41597-020-00688-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41597-020-00688-8</pub-id>
          <pub-id pub-id-type="medline">33033256</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41597-020-00688-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC7545176</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>FK</given-names>
            </name>
            <name name-style="western">
              <surname>Leavitt</surname>
              <given-names>SV</given-names>
            </name>
            <name name-style="western">
              <surname>Ung</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Labrique</surname>
              <given-names>AB</given-names>
            </name>
            <name name-style="western">
              <surname>Peters</surname>
              <given-names>DH</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>EC</given-names>
            </name>
            <name name-style="western">
              <surname>Azman</surname>
              <given-names>AS</given-names>
            </name>
            <collab>HIT-COVID Collaboration</collab>
          </person-group>
          <article-title>HIT-COVID, a global database tracking public health interventions to COVID-19</article-title>
          <source>Sci Data</source>
          <year>2020</year>
          <month>08</month>
          <day>27</day>
          <volume>7</volume>
          <issue>1</issue>
          <fpage>286</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41597-020-00610-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41597-020-00610-2</pub-id>
          <pub-id pub-id-type="medline">32855428</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41597-020-00610-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC7453020</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Desvars-Larrive</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Dervic</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Haug</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Niederkrotenthaler</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Di Natale</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lasser</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Gliga</surname>
              <given-names>DS</given-names>
            </name>
            <name name-style="western">
              <surname>Roux</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sorger</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chakraborty</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ten</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Dervic</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Pacheco</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Jurczak</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cserjan</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Lederhilger</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Bulska</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Berishaj</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Tames</surname>
              <given-names>EF</given-names>
            </name>
            <name name-style="western">
              <surname>Álvarez</surname>
              <given-names>FS</given-names>
            </name>
            <name name-style="western">
              <surname>Takriti</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Korbel</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Reddish</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Grzymała-Moszczyńska</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Stangl</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hadziavdic</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Stoeger</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Gooriah</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Geyrhofer</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ferreira</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Bartoszek</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Vierlinger</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Holder</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Haberfellner</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ahne</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Reisch</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Servedio</surname>
              <given-names>VDP</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Pocasangre-Orellana</surname>
              <given-names>XM</given-names>
            </name>
            <name name-style="western">
              <surname>Garncarek</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Garcia</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Thurner</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>A structured open dataset of government interventions in response to COVID-19</article-title>
          <source>Sci Data</source>
          <year>2020</year>
          <month>08</month>
          <day>27</day>
          <volume>7</volume>
          <issue>1</issue>
          <fpage>285</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41597-020-00609-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41597-020-00609-9</pub-id>
          <pub-id pub-id-type="medline">32855430</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41597-020-00609-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC7452888</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Argenziano</surname>
              <given-names>MG</given-names>
            </name>
            <name name-style="western">
              <surname>Bruce</surname>
              <given-names>SL</given-names>
            </name>
            <name name-style="western">
              <surname>Slater</surname>
              <given-names>CL</given-names>
            </name>
            <name name-style="western">
              <surname>Tiao</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Baldwin</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Barr</surname>
              <given-names>RG</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>BP</given-names>
            </name>
            <name name-style="western">
              <surname>Chau</surname>
              <given-names>KH</given-names>
            </name>
            <name name-style="western">
              <surname>Choi</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Gavin</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Goyal</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Mills</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Romney</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Safford</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Schluger</surname>
              <given-names>NW</given-names>
            </name>
            <name name-style="western">
              <surname>Sengupta</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sobieszczyk</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Zucker</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Asadourian</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Bell</surname>
              <given-names>FM</given-names>
            </name>
            <name name-style="western">
              <surname>Boyd</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>MF</given-names>
            </name>
            <name name-style="western">
              <surname>Colquhoun</surname>
              <given-names>MI</given-names>
            </name>
            <name name-style="western">
              <surname>Colville</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>de Jonge</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Dershowitz</surname>
              <given-names>LB</given-names>
            </name>
            <name name-style="western">
              <surname>Dey</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Eiseman</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Girvin</surname>
              <given-names>ZP</given-names>
            </name>
            <name name-style="western">
              <surname>Goni</surname>
              <given-names>DT</given-names>
            </name>
            <name name-style="western">
              <surname>Harb</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Herzik</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Householder</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Karaaslan</surname>
              <given-names>LE</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Lieberman</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Ling</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Shou</surname>
              <given-names>AY</given-names>
            </name>
            <name name-style="western">
              <surname>Sisti</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Snow</surname>
              <given-names>ZE</given-names>
            </name>
            <name name-style="western">
              <surname>Sperring</surname>
              <given-names>CP</given-names>
            </name>
            <name name-style="western">
              <surname>Xiong</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>HW</given-names>
            </name>
            <name name-style="western">
              <surname>Natarajan</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Hripcsak</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Characterization and clinical course of 1000 patients with coronavirus disease 2019 in New York: retrospective case series</article-title>
          <source>BMJ</source>
          <year>2020</year>
          <month>05</month>
          <day>29</day>
          <volume>369</volume>
          <fpage>m1996</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.bmj.com/lookup/pmidlookup?view=long&#38;pmid=32471884"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmj.m1996</pub-id>
          <pub-id pub-id-type="medline">32471884</pub-id>
          <pub-id pub-id-type="pmcid">PMC7256651</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Benitez</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Malin</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Evaluating re-identification risks with respect to the HIPAA privacy rule</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2010</year>
          <volume>17</volume>
          <issue>2</issue>
          <fpage>169</fpage>
          <lpage>177</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/20190059"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/jamia.2009.000026</pub-id>
          <pub-id pub-id-type="medline">20190059</pub-id>
          <pub-id pub-id-type="pii">17/2/169</pub-id>
          <pub-id pub-id-type="pmcid">PMC3000773</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ta</surname>
              <given-names>CN</given-names>
            </name>
            <name name-style="western">
              <surname>Dumontier</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hripcsak</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Tatonetti</surname>
              <given-names>NP</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Columbia Open Health Data, clinical concept prevalence and co-occurrence from electronic health records</article-title>
          <source>Sci Data</source>
          <year>2018</year>
          <month>11</month>
          <day>27</day>
          <volume>5</volume>
          <fpage>180273</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/sdata.2018.273"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/sdata.2018.273</pub-id>
          <pub-id pub-id-type="medline">30480666</pub-id>
          <pub-id pub-id-type="pii">sdata2018273</pub-id>
          <pub-id pub-id-type="pmcid">PMC6257042</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ahalt</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Chute</surname>
              <given-names>CG</given-names>
            </name>
            <name name-style="western">
              <surname>Fecho</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Glusman</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Hadlock</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Taylor</surname>
              <given-names>CO</given-names>
            </name>
            <name name-style="western">
              <surname>Pfaff</surname>
              <given-names>ER</given-names>
            </name>
            <name name-style="western">
              <surname>Robinson</surname>
              <given-names>PN</given-names>
            </name>
            <name name-style="western">
              <surname>Solbrig</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Ta</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Tatonetti</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
            <collab>Biomedical Data Translator Consortium</collab>
          </person-group>
          <article-title>Clinical Data: Sources and Types, Regulatory Constraints, Applications</article-title>
          <source>Clin Transl Sci</source>
          <year>2019</year>
          <month>07</month>
          <volume>12</volume>
          <issue>4</issue>
          <fpage>329</fpage>
          <lpage>333</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31074176"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/cts.12638</pub-id>
          <pub-id pub-id-type="medline">31074176</pub-id>
          <pub-id pub-id-type="pmcid">PMC6617834</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fecho</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Ahalt</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Arunachalam</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Champion</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chute</surname>
              <given-names>CG</given-names>
            </name>
            <name name-style="western">
              <surname>Davis</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Gersing</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Glusman</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Hadlock</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Pfaff</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Robinson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sid</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Ta</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Peden</surname>
              <given-names>DB</given-names>
            </name>
            <collab>Biomedical Data Translator Consortium</collab>
          </person-group>
          <article-title>Sex, obesity, diabetes, and exposure to particulate matter among patients with severe asthma: Scientific insights from a comparative analysis of open clinical data sources during a five-day hackathon</article-title>
          <source>J Biomed Inform</source>
          <year>2019</year>
          <month>12</month>
          <volume>100</volume>
          <fpage>103325</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(19)30244-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2019.103325</pub-id>
          <pub-id pub-id-type="medline">31676459</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(19)30244-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC6953386</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dyal</surname>
              <given-names>NP</given-names>
            </name>
          </person-group>
          <article-title>First Case of COVID-19 in NYC, First Death Reported in Washington State</article-title>
          <source>Infectious Disease Advisor</source>
          <year>2020</year>
          <month>03</month>
          <day>03</day>
          <access-date>2020-11-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.infectiousdiseaseadvisor.com/home/topics/respiratory/first-case-of-covid-19-in-nyc-first-death-reported-in-washington-state/">https://www.infectiousdiseaseadvisor.com/home/topics/respiratory/first-case-of-covid-19-in-nyc-first-death-reported-in-washington-state/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="web">
          <source>Columbia Open Health Data - COVID-19</source>
          <access-date>2021-09-20</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://covid.cohd.io/">https://covid.cohd.io/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hripcsak</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Ta</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>COHD-COVID: Columbia Open Health Data for COVID-19 Research</article-title>
          <source>Figshare</source>
          <access-date>2021-09-20</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.6084/m9.figshare.14739426.v1">https://doi.org/10.6084/m9.figshare.14739426.v1</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ta</surname>
              <given-names>CN</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Detecting Systemic Data Quality Issues in Electronic Health Records</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2019</year>
          <month>08</month>
          <day>21</day>
          <volume>264</volume>
          <fpage>383</fpage>
          <lpage>387</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31437950"/>
          </comment>
          <pub-id pub-id-type="doi">10.3233/SHTI190248</pub-id>
          <pub-id pub-id-type="medline">31437950</pub-id>
          <pub-id pub-id-type="pii">SHTI190248</pub-id>
          <pub-id pub-id-type="pmcid">PMC6857180</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kahn</surname>
              <given-names>MG</given-names>
            </name>
            <name name-style="western">
              <surname>Callahan</surname>
              <given-names>TJ</given-names>
            </name>
            <name name-style="western">
              <surname>Barnard</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bauck</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Brown</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Davidson</surname>
              <given-names>BN</given-names>
            </name>
            <name name-style="western">
              <surname>Estiri</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Goerg</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Holve</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>SG</given-names>
            </name>
            <name name-style="western">
              <surname>Liaw</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hamilton-Lopez</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Meeker</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ong</surname>
              <given-names>TC</given-names>
            </name>
            <name name-style="western">
              <surname>Ryan</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Shang</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Weiskopf</surname>
              <given-names>NG</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zozus</surname>
              <given-names>MN</given-names>
            </name>
            <name name-style="western">
              <surname>Schilling</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>A Harmonized Data Quality Assessment Terminology and Framework for the Secondary Use of Electronic Health Record Data</article-title>
          <source>EGEMS (Wash DC)</source>
          <year>2016</year>
          <volume>4</volume>
          <issue>1</issue>
          <fpage>1244</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27713905"/>
          </comment>
          <pub-id pub-id-type="doi">10.13063/2327-9214.1244</pub-id>
          <pub-id pub-id-type="medline">27713905</pub-id>
          <pub-id pub-id-type="pii">egems1244</pub-id>
          <pub-id pub-id-type="pmcid">PMC5051581</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="web">
          <article-title>COVID-19 Daily Counts of Cases, Hospitalizations, and Deaths</article-title>
          <source>NYC Open Data</source>
          <access-date>2021-09-20</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://data.cityofnewyork.us/resource/rc75-m7u3">https://data.cityofnewyork.us/resource/rc75-m7u3</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Geleris</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Platt</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zucker</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Baldwin</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hripcsak</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Labella</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Manson</surname>
              <given-names>DK</given-names>
            </name>
            <name name-style="western">
              <surname>Kubin</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Barr</surname>
              <given-names>RG</given-names>
            </name>
            <name name-style="western">
              <surname>Sobieszczyk</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Schluger</surname>
              <given-names>NW</given-names>
            </name>
          </person-group>
          <article-title>Observational Study of Hydroxychloroquine in Hospitalized Patients with Covid-19</article-title>
          <source>N Engl J Med</source>
          <year>2020</year>
          <month>06</month>
          <day>18</day>
          <volume>382</volume>
          <issue>25</issue>
          <fpage>2411</fpage>
          <lpage>2418</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32379955"/>
          </comment>
          <pub-id pub-id-type="doi">10.1056/NEJMoa2012410</pub-id>
          <pub-id pub-id-type="medline">32379955</pub-id>
          <pub-id pub-id-type="pmcid">PMC7224609</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Guan</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Ni</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Ou</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Shan</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Lei</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hui</surname>
              <given-names>DSC</given-names>
            </name>
            <name name-style="western">
              <surname>Du</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Yuen</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Xiang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Qiu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ye</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zhong</surname>
              <given-names>N</given-names>
            </name>
            <collab>China Medical Treatment Expert Group for Covid-19</collab>
          </person-group>
          <article-title>Clinical Characteristics of Coronavirus Disease 2019 in China</article-title>
          <source>N Engl J Med</source>
          <year>2020</year>
          <month>04</month>
          <day>30</day>
          <volume>382</volume>
          <issue>18</issue>
          <fpage>1708</fpage>
          <lpage>1720</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32109013"/>
          </comment>
          <pub-id pub-id-type="doi">10.1056/NEJMoa2002032</pub-id>
          <pub-id pub-id-type="medline">32109013</pub-id>
          <pub-id pub-id-type="pmcid">PMC7092819</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fifi</surname>
              <given-names>JT</given-names>
            </name>
            <name name-style="western">
              <surname>Mocco</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>COVID-19 related stroke in young individuals</article-title>
          <source>Lancet Neurol</source>
          <year>2020</year>
          <month>09</month>
          <volume>19</volume>
          <issue>9</issue>
          <fpage>713</fpage>
          <lpage>715</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32822622"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S1474-4422(20)30272-6</pub-id>
          <pub-id pub-id-type="medline">32822622</pub-id>
          <pub-id pub-id-type="pii">S1474-4422(20)30272-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC7434432</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Oxley</surname>
              <given-names>TJ</given-names>
            </name>
            <name name-style="western">
              <surname>Mocco</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Majidi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kellner</surname>
              <given-names>CP</given-names>
            </name>
            <name name-style="western">
              <surname>Shoirah</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>IP</given-names>
            </name>
            <name name-style="western">
              <surname>De Leacy</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Shigematsu</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ladner</surname>
              <given-names>TR</given-names>
            </name>
            <name name-style="western">
              <surname>Yaeger</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Skliut</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Weinberger</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dangayach</surname>
              <given-names>NS</given-names>
            </name>
            <name name-style="western">
              <surname>Bederson</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Tuhrim</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Fifi</surname>
              <given-names>JT</given-names>
            </name>
          </person-group>
          <article-title>Large-Vessel Stroke as a Presenting Feature of Covid-19 in the Young</article-title>
          <source>N Engl J Med</source>
          <year>2020</year>
          <month>05</month>
          <day>14</day>
          <volume>382</volume>
          <issue>20</issue>
          <fpage>e60</fpage>
          <pub-id pub-id-type="doi">10.1056/NEJMc2009787</pub-id>
          <pub-id pub-id-type="medline">32343504</pub-id>
          <pub-id pub-id-type="pmcid">PMC7207073</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <collab>Biomedical Data Translator Consortium</collab>
          </person-group>
          <article-title>Toward A Universal Biomedical Data Translator</article-title>
          <source>Clin Transl Sci</source>
          <year>2019</year>
          <month>03</month>
          <volume>12</volume>
          <issue>2</issue>
          <fpage>86</fpage>
          <lpage>90</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30412337"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/cts.12591</pub-id>
          <pub-id pub-id-type="medline">30412337</pub-id>
          <pub-id pub-id-type="pmcid">PMC6440568</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <collab>Biomedical Data Translator Consortium</collab>
          </person-group>
          <article-title>The Biomedical Data Translator Program: Conception, Culture, and Community</article-title>
          <source>Clin Transl Sci</source>
          <year>2019</year>
          <month>03</month>
          <volume>12</volume>
          <issue>2</issue>
          <fpage>91</fpage>
          <lpage>94</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30412340"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/cts.12592</pub-id>
          <pub-id pub-id-type="medline">30412340</pub-id>
          <pub-id pub-id-type="pmcid">PMC6440573</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
