<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<?covid-19-tdm?>
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v23i3e22219</article-id>
      <article-id pub-id-type="pmid">33600347</article-id>
      <article-id pub-id-type="doi">10.2196/22219</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Viewpoint</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Viewpoint</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>What Every Reader Should Know About Studies Using Electronic Health Record Data but May Be Afraid to Ask</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Kukafka</surname>
            <given-names>Rita</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Delvaux</surname>
            <given-names>Nicolas</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Adly</surname>
            <given-names>Mahmoud</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Harris</surname>
            <given-names>Paul</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Adly</surname>
            <given-names>Afnan</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Adly</surname>
            <given-names>Aya</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Li</surname>
            <given-names>Jinfeng</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Genaro</surname>
            <given-names>Luis</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Kohane</surname>
            <given-names>Isaac S</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff01" ref-type="aff">1</xref>
          <address>
            <institution>Department of Biomedical Informatics</institution>
            <institution>Harvard Medical School</institution>
            <addr-line>10 Shattuck Street</addr-line>
            <addr-line>Boston, MA, 02115</addr-line>
            <country>United States</country>
            <phone>1 617 432 3226</phone>
            <email>isaac_kohane@harvard.edu</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2192-5160</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Aronow</surname>
            <given-names>Bruce J</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff02" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5109-6514</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Avillach</surname>
            <given-names>Paul</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff01" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0235-7543</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Beaulieu-Jones</surname>
            <given-names>Brett K</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff01" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6700-1468</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Bellazzi</surname>
            <given-names>Riccardo</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff03" ref-type="aff">3</xref>
          <xref rid="aff04" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6974-9808</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Bradford</surname>
            <given-names>Robert L</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff05" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0908-1428</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Brat</surname>
            <given-names>Gabriel A</given-names>
          </name>
          <degrees>MD, MPH</degrees>
          <xref rid="aff01" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-3928-5931</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Cannataro</surname>
            <given-names>Mario</given-names>
          </name>
          <degrees>MS</degrees>
          <xref rid="aff06" ref-type="aff">6</xref>
          <xref rid="aff07" ref-type="aff">7</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1502-2387</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author">
          <name name-style="western">
            <surname>Cimino</surname>
            <given-names>James J</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff08" ref-type="aff">8</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4101-1622</ext-link>
        </contrib>
        <contrib id="contrib10" contrib-type="author">
          <name name-style="western">
            <surname>García-Barrio</surname>
            <given-names>Noelia</given-names>
          </name>
          <degrees>MS</degrees>
          <xref rid="aff09" ref-type="aff">9</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2789-8426</ext-link>
        </contrib>
        <contrib id="contrib11" contrib-type="author">
          <name name-style="western">
            <surname>Gehlenborg</surname>
            <given-names>Nils</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff01" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0327-8297</ext-link>
        </contrib>
        <contrib id="contrib12" contrib-type="author">
          <name name-style="western">
            <surname>Ghassemi</surname>
            <given-names>Marzyeh</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff10" ref-type="aff">10</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6349-7251</ext-link>
        </contrib>
        <contrib id="contrib13" contrib-type="author">
          <name name-style="western">
            <surname>Gutiérrez-Sacristán</surname>
            <given-names>Alba</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff01" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-1245-198X</ext-link>
        </contrib>
        <contrib id="contrib14" contrib-type="author">
          <name name-style="western">
            <surname>Hanauer</surname>
            <given-names>David A</given-names>
          </name>
          <degrees>MS, MD</degrees>
          <xref rid="aff11" ref-type="aff">11</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6931-3791</ext-link>
        </contrib>
        <contrib id="contrib15" contrib-type="author">
          <name name-style="western">
            <surname>Holmes</surname>
            <given-names>John H</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff12" ref-type="aff">12</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2167-3602</ext-link>
        </contrib>
        <contrib id="contrib16" contrib-type="author">
          <name name-style="western">
            <surname>Hong</surname>
            <given-names>Chuan</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff01" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7056-9559</ext-link>
        </contrib>
        <contrib id="contrib17" contrib-type="author">
          <name name-style="western">
            <surname>Klann</surname>
            <given-names>Jeffrey G</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff13" ref-type="aff">13</xref>
          <xref rid="aff14" ref-type="aff">14</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2043-1601</ext-link>
        </contrib>
        <contrib id="contrib18" contrib-type="author">
          <name name-style="western">
            <surname>Loh</surname>
            <given-names>Ne Hooi Will</given-names>
          </name>
          <degrees>MBBS, FRCA, FFICM, EDIC</degrees>
          <xref rid="aff15" ref-type="aff">15</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-4114-1286</ext-link>
        </contrib>
        <contrib id="contrib19" contrib-type="author">
          <name name-style="western">
            <surname>Luo</surname>
            <given-names>Yuan</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff16" ref-type="aff">16</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0195-7456</ext-link>
        </contrib>
        <contrib id="contrib20" contrib-type="author">
          <name name-style="western">
            <surname>Mandl</surname>
            <given-names>Kenneth D</given-names>
          </name>
          <degrees>MPH, MD</degrees>
          <xref rid="aff17" ref-type="aff">17</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9781-0477</ext-link>
        </contrib>
        <contrib id="contrib21" contrib-type="author">
          <name name-style="western">
            <surname>Daniar</surname>
            <given-names>Mohamad</given-names>
          </name>
          <degrees>MSIS</degrees>
          <xref rid="aff18" ref-type="aff">18</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9031-0835</ext-link>
        </contrib>
        <contrib id="contrib22" contrib-type="author">
          <name name-style="western">
            <surname>Moore</surname>
            <given-names>Jason H</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff19" ref-type="aff">19</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5015-1099</ext-link>
        </contrib>
        <contrib id="contrib23" contrib-type="author">
          <name name-style="western">
            <surname>Murphy</surname>
            <given-names>Shawn N</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff01" ref-type="aff">1</xref>
          <xref rid="aff20" ref-type="aff">20</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-1905-8806</ext-link>
        </contrib>
        <contrib id="contrib24" contrib-type="author">
          <name name-style="western">
            <surname>Neuraz</surname>
            <given-names>Antoine</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff21" ref-type="aff">21</xref>
          <xref rid="aff22" ref-type="aff">22</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7142-6728</ext-link>
        </contrib>
        <contrib id="contrib25" contrib-type="author">
          <name name-style="western">
            <surname>Ngiam</surname>
            <given-names>Kee Yuan</given-names>
          </name>
          <degrees>MBBS, MRCS, MMed</degrees>
          <xref rid="aff15" ref-type="aff">15</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5676-2520</ext-link>
        </contrib>
        <contrib id="contrib26" contrib-type="author">
          <name name-style="western">
            <surname>Omenn</surname>
            <given-names>Gilbert S</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff23" ref-type="aff">23</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-8976-6074</ext-link>
        </contrib>
        <contrib id="contrib27" contrib-type="author">
          <name name-style="western">
            <surname>Palmer</surname>
            <given-names>Nathan</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff01" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-4361-207X</ext-link>
        </contrib>
        <contrib id="contrib28" contrib-type="author">
          <name name-style="western">
            <surname>Patel</surname>
            <given-names>Lav P</given-names>
          </name>
          <degrees>MS</degrees>
          <xref rid="aff24" ref-type="aff">24</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-8626-137X</ext-link>
        </contrib>
        <contrib id="contrib29" contrib-type="author">
          <name name-style="western">
            <surname>Pedrera-Jiménez</surname>
            <given-names>Miguel</given-names>
          </name>
          <degrees>MS</degrees>
          <xref rid="aff09" ref-type="aff">9</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0187-3826</ext-link>
        </contrib>
        <contrib id="contrib30" contrib-type="author">
          <name name-style="western">
            <surname>Sliz</surname>
            <given-names>Piotr</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff17" ref-type="aff">17</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6522-0835</ext-link>
        </contrib>
        <contrib id="contrib31" contrib-type="author">
          <name name-style="western">
            <surname>South</surname>
            <given-names>Andrew M</given-names>
          </name>
          <degrees>MS, MD</degrees>
          <xref rid="aff25" ref-type="aff">25</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-3204-4142</ext-link>
        </contrib>
        <contrib id="contrib32" contrib-type="author">
          <name name-style="western">
            <surname>Tan</surname>
            <given-names>Amelia Li Min</given-names>
          </name>
          <degrees>BSc, PhD</degrees>
          <xref rid="aff01" ref-type="aff">1</xref>
          <xref rid="aff26" ref-type="aff">26</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0623-6623</ext-link>
        </contrib>
        <contrib id="contrib33" contrib-type="author">
          <name name-style="western">
            <surname>Taylor</surname>
            <given-names>Deanne M</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff27" ref-type="aff">27</xref>
          <xref rid="aff28" ref-type="aff">28</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-3302-4610</ext-link>
        </contrib>
        <contrib id="contrib34" contrib-type="author">
          <name name-style="western">
            <surname>Taylor</surname>
            <given-names>Bradley W</given-names>
          </name>
          <degrees>MS</degrees>
          <xref rid="aff29" ref-type="aff">29</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6414-4172</ext-link>
        </contrib>
        <contrib id="contrib35" contrib-type="author">
          <name name-style="western">
            <surname>Torti</surname>
            <given-names>Carlo</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff07" ref-type="aff">7</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7631-5453</ext-link>
        </contrib>
        <contrib id="contrib36" contrib-type="author">
          <name name-style="western">
            <surname>Vallejos</surname>
            <given-names>Andrew K</given-names>
          </name>
          <degrees>MS</degrees>
          <xref rid="aff29" ref-type="aff">29</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6543-5430</ext-link>
        </contrib>
        <contrib id="contrib37" contrib-type="author">
          <name name-style="western">
            <surname>Wagholikar</surname>
            <given-names>Kavishwar B</given-names>
          </name>
          <degrees>MBBS, PhD</degrees>
          <xref rid="aff13" ref-type="aff">13</xref>
          <xref rid="aff14" ref-type="aff">14</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6219-861X</ext-link>
        </contrib>
        <contrib id="contrib38" contrib-type="author">
          <collab>The Consortium For Clinical Characterization Of COVID-19 By EHR (4CE)</collab>
          <xref rid="aff30" ref-type="aff">30</xref>
        </contrib>
        <contrib id="contrib39" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Weber</surname>
            <given-names>Griffin M</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff01" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2597-881X</ext-link>
        </contrib>
        <contrib id="contrib40" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Cai</surname>
            <given-names>Tianxi</given-names>
          </name>
          <degrees>ScD</degrees>
          <xref rid="aff01" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5379-2502</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff01">
        <label>1</label>
        <institution>Department of Biomedical Informatics</institution>
        <institution>Harvard Medical School</institution>
        <addr-line>Boston, MA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff02">
        <label>2</label>
        <institution>Biomedical Informatics</institution>
        <institution>Cincinnati Children's Hospital Medical Center</institution>
        <institution>University of Cincinnati</institution>
        <addr-line>Cincinnati, OH</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff03">
        <label>3</label>
        <institution>Department of Electrical, Computer and Biomedical Engineering</institution>
        <institution>University of Pavia</institution>
        <addr-line>Pavia</addr-line>
        <country>Italy</country>
      </aff>
      <aff id="aff04">
        <label>4</label>
        <institution>ICS Maugeri</institution>
        <addr-line>Pavia</addr-line>
        <country>Italy</country>
      </aff>
      <aff id="aff05">
        <label>5</label>
        <institution>North Carolina Translational and Clinical Sciences Institute</institution>
        <institution>University of North Carolina at Chapel Hill</institution>
        <addr-line>Chapel Hill, NC</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff06">
        <label>6</label>
        <institution>Data Analytics Research Center</institution>
        <institution>University Magna Graecia of Catanzaro</institution>
        <addr-line>Catanzaro</addr-line>
        <country>Italy</country>
      </aff>
      <aff id="aff07">
        <label>7</label>
        <institution>Department of Medical and Surgical Sciences</institution>
        <institution>University Magna Graecia of Catanzaro</institution>
        <addr-line>Catanzaro</addr-line>
        <country>Italy</country>
      </aff>
      <aff id="aff08">
        <label>8</label>
        <institution>Informatics Institute</institution>
        <institution>University of Alabama at Birmingham</institution>
        <addr-line>Birmingham, AL</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff09">
        <label>9</label>
        <institution>Department of Informatics</institution>
        <institution>12 de Octubre University Hospital</institution>
        <addr-line>Madrid</addr-line>
        <country>Spain</country>
      </aff>
      <aff id="aff10">
        <label>10</label>
        <institution>Department of Computer Science and Medicine</institution>
        <institution>University of Toronto</institution>
        <addr-line>Toronto, ON</addr-line>
        <country>Canada</country>
      </aff>
      <aff id="aff11">
        <label>11</label>
        <institution>Department of Learning Health Sciences</institution>
        <institution>University of Michigan Medical School</institution>
        <addr-line>Ann Arbor, MI</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff12">
        <label>12</label>
        <institution>Department of Biostatistics, Epidemiology, and Informatics</institution>
        <institution>Perelman School of Medicine</institution>
        <institution>University of Pennsylvania</institution>
        <addr-line>Philadelphia, PA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff13">
        <label>13</label>
        <institution>Department of Medicine</institution>
        <institution>Harvard Medical School</institution>
        <addr-line>Boston, MA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff14">
        <label>14</label>
        <institution>Laboratory of Computer Science</institution>
        <institution>Massachusetts General Hospital</institution>
        <addr-line>Boston, MA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff15">
        <label>15</label>
        <institution>National University Health Systems</institution>
        <addr-line>Singapore</addr-line>
        <country>Singapore</country>
      </aff>
      <aff id="aff16">
        <label>16</label>
        <institution>Department of Preventive Medicine</institution>
        <institution>Northwestern University</institution>
        <addr-line>Chicago, IL</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff17">
        <label>17</label>
        <institution>Computational Health Informatics Program</institution>
        <institution>Boston Children's Hospital</institution>
        <addr-line>Boston, MA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff18">
        <label>18</label>
        <institution>Clinical Research Informatics</institution>
        <institution>Boston Children's Hospital</institution>
        <addr-line>Boston, MA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff19">
        <label>19</label>
        <institution>Institute for Biomedical Informatics</institution>
        <institution>University of Pennsylvania</institution>
        <addr-line>Philadelphia, PA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff20">
        <label>20</label>
        <institution>Department of Neurology</institution>
        <institution>Massachusetts General Hospital</institution>
        <addr-line>Boston, MA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff21">
        <label>21</label>
        <institution>Department of Biomedical Informatics</institution>
        <institution>Necker-Enfants Malades Hospital</institution>
        <institution>Assistance Publique - Hôpitaux de Paris</institution>
        <addr-line>Paris</addr-line>
        <country>France</country>
      </aff>
      <aff id="aff22">
        <label>22</label>
        <institution>Centre de Recherche des Cordeliers</institution>
        <institution>INSERM UMRS 1138 Team 22</institution>
        <institution>Université de Paris</institution>
        <addr-line>Paris</addr-line>
        <country>France</country>
      </aff>
      <aff id="aff23">
        <label>23</label>
        <institution>Department of Computational Medicine &#38; Bioinformatics</institution>
        <institution>University of Michigan</institution>
        <addr-line>Ann Arbor, MI</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff24">
        <label>24</label>
        <institution>Department of Internal Medicine</institution>
        <institution>Division of Medical Informatics</institution>
        <institution>University of Kansas Medical Center</institution>
        <addr-line>Kansas City, KS</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff25">
        <label>25</label>
        <institution>Section of Nephrology, Department of Pediatrics</institution>
        <institution>Brenner Children's Hospital</institution>
        <institution>Wake Forest School of Medicine</institution>
        <addr-line>Winston-Salem, NC</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff26">
        <label>26</label>
        <institution>Department of Biomedical Informatics</institution>
        <institution>National University of Singapore</institution>
        <addr-line>Singapore</addr-line>
        <country>Singapore</country>
      </aff>
      <aff id="aff27">
        <label>27</label>
        <institution>Department of Biomedical and Health Informatics</institution>
        <institution>The Children's Hospital of Philadelphia</institution>
        <addr-line>Philadelphia, PA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff28">
        <label>28</label>
        <institution>Department of Pediatrics</institution>
        <institution>Perelman School of Medicine</institution>
        <institution>The University of Pennsylvania</institution>
        <addr-line>Philadelphia, PA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff29">
        <label>29</label>
        <institution>Clinical and Translational Science Institute</institution>
        <institution>Medical College of Wisconsin</institution>
        <addr-line>Milwaukee, WI</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff30">
        <label>30</label>
        <institution>See Acknowledgments</institution>
      </aff>
      <pub-date pub-type="collection">
        <month>3</month>
        <year>2021</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>2</day>
        <month>3</month>
        <year>2021</year>
      </pub-date>
      <volume>23</volume>
      <issue>3</issue>
      <elocation-id>e22219</elocation-id>
      <history>
        <date date-type="received">
          <day>13</day>
          <month>7</month>
          <year>2020</year>
        </date>
        <date date-type="rev-request">
          <day>4</day>
          <month>8</month>
          <year>2020</year>
        </date>
        <date date-type="rev-recd">
          <day>14</day>
          <month>9</month>
          <year>2020</year>
        </date>
        <date date-type="accepted">
          <day>10</day>
          <month>1</month>
          <year>2021</year>
        </date>
      </history>
      <copyright-statement>©Isaac S Kohane, Bruce J Aronow, Paul Avillach, Brett K Beaulieu-Jones, Riccardo Bellazzi, Robert L Bradford, Gabriel A Brat, Mario Cannataro, James J Cimino, Noelia García-Barrio, Nils Gehlenborg, Marzyeh Ghassemi, Alba Gutiérrez-Sacristán, David A Hanauer, John H Holmes, Chuan Hong, Jeffrey G Klann, Ne Hooi Will Loh, Yuan Luo, Kenneth D Mandl, Mohamad Daniar, Jason H Moore, Shawn N Murphy, Antoine Neuraz, Kee Yuan Ngiam, Gilbert S Omenn, Nathan Palmer, Lav P Patel, Miguel Pedrera-Jiménez, Piotr Sliz, Andrew M South, Amelia Li Min Tan, Deanne M Taylor, Bradley W Taylor, Carlo Torti, Andrew K Vallejos, Kavishwar B Wagholikar, The Consortium For Clinical Characterization Of COVID-19 By EHR (4CE), Griffin M Weber, Tianxi Cai. Originally published in the Journal of Medical Internet Research (http://www.jmir.org), 02.03.2021.</copyright-statement>
      <copyright-year>2021</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on http://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2021/3/e22219" xlink:type="simple"/>
      <abstract>
        <p>Coincident with the tsunami of COVID-19–related publications, there has been a surge of studies using real-world data, including those obtained from the electronic health record (EHR). Unfortunately, several of these high-profile publications were retracted because of concerns regarding the soundness and quality of the studies and the EHR data they purported to analyze. These retractions highlight that although a small community of EHR informatics experts can readily identify strengths and flaws in EHR-derived studies, many medical editorial teams and otherwise sophisticated medical readers lack the framework to fully critically appraise these studies. In addition, conventional statistical analyses cannot overcome the need for an understanding of the opportunities and limitations of EHR-derived studies. We distill here from the broader informatics literature six key considerations that are crucial for appraising studies utilizing EHR data: data completeness, data collection and handling (eg, transformation), data type (ie, codified, textual), robustness of methods against EHR variability (within and across institutions, countries, and time), transparency of data and analytic code, and the multidisciplinary approach. These considerations will inform researchers, clinicians, and other stakeholders as to the recommended best practices in reviewing manuscripts, grants, and other outputs from EHR data–derived studies, and thereby promote and foster rigor, quality, and reliability of this rapidly growing field.</p>
      </abstract>
      <kwd-group>
        <kwd>COVID-19</kwd>
        <kwd>electronic health records</kwd>
        <kwd>real-world data</kwd>
        <kwd>literature</kwd>
        <kwd>publishing</kwd>
        <kwd>quality</kwd>
        <kwd>data quality</kwd>
        <kwd>reporting standards</kwd>
        <kwd>reporting checklist</kwd>
        <kwd>review</kwd>
        <kwd>statistics</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>What should researchers and clinicians conclude about the recent high-profile retractions of COVID-19 studies based on electronic health record (EHR) data? It is impressive that two publications involving patients with COVID-19, one in The Lancet [<xref ref-type="bibr" rid="ref1">1</xref>] and the other in the New England Journal of Medicine [<xref ref-type="bibr" rid="ref2">2</xref>], were determined to be unsound and were retracted in less than 2 months from publication, as these journals’ review processes and quality checks are among the most rigorous in the world. Yet, upon closer inspection by those of us familiar with EHR-based research, there were many flaws to these studies involving data quality issues and a lack of transparency that should have been more readily identified during the peer and editorial review process. This is not to say that in-depth statistical analysis might not have eventually uncovered concerns but rather to point out incongruities and anomalies unique to EHR-based studies that should immediately raise concerns to experienced biomedical informaticians, much like an experienced contractor explaining to a homeowner why a competing bid is too good to be true.</p>
      <p>In this viewpoint, we present six key questions that are necessary to consider when appraising EHR-based research, especially for research studies investigating the pandemic:</p>
      <list list-type="order">
        <list-item>
          <p>How complete are the data?</p>
        </list-item>
        <list-item>
          <p>How were the data collected and handled?</p>
        </list-item>
        <list-item>
          <p>What were the specific data types?</p>
        </list-item>
        <list-item>
          <p>Did the analysis account for EHR variability?</p>
        </list-item>
        <list-item>
          <p>Are the data and analytic code transparent?</p>
        </list-item>
        <list-item>
          <p>Was the study appropriately multidisciplinary?</p>
        </list-item>
      </list>
      <p>In particular, we focus on general aspects of these questions that are crucial to study and data quality and to the validity and interpretability of the results and that are broadly applicable to many stakeholders, including researchers and clinicians, in order to optimize the review of submitted manuscripts, published studies, and grant applications containing preliminary data. These desiderata were compiled by the 96 members of the Consortium for Clinical Characterization of COVID-19 by EHR (4CE)—a self-assembled group of collaborating hospitals focused specifically on studying the clinical course of patients with COVID-19 using EHR-based data—most of whom are biomedical informaticians—across 7 countries. 4CE members were invited to contribute their specific key concerns to a shared checklist. This list was then pared down into a less technical list for a more general audience. We excluded those items that are generally considered to be good biostatistical practices (eg, manual review of sample data sets, detecting and understanding outliers [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref4">4</xref>]) to present EHR-specific concerns to a broad biomedical audience. We also excluded recommendations that are contained within the Reporting of Studies Conducted Using Observational Routinely Collected Health Data (RECORD) statement [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref6">6</xref>], which are not specific to EHR-derived data. 
Finally, we did not focus on the specific limitations of EHR-derived studies, which have been amply documented [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref8">8</xref>], or on the methods to minimize the impact of these limitations, as this viewpoint is not focused on reviewing specific methodological options for investigators using EHR-derived data, which has been reviewed in detail previously [<xref ref-type="bibr" rid="ref9">9</xref>-<xref ref-type="bibr" rid="ref11">11</xref>]. We acknowledge that there are many other criteria that can inform evaluations of EHR-based studies, but we have purposefully limited this discussion to those issues that are most relevant to a general audience, centered on studies investigating the pandemic.</p>
    </sec>
    <sec>
      <title>Data Completeness</title>
      <p>There are several statistical tests to query data completeness and methods for incorporating missing data [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>], but here we describe the reasonable expectations for such completeness with knowledge of current, state-of-the-art EHR usage. A publication that is specific about which data were obtained from the EHR (eg, specific laboratory tests or billing codes) is more credible than a study that simply claims it obtained 100% of the EHR data (as did the two recently retracted publications [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]). The range of data types from EHRs is extensive and highly varied; each data type requires its own specific quality control and transformations to standard terminologies. For example, laboratory measurements alone can have as many as hundreds of thousands of local codes at a large health care system such as the Veterans Health Administration. In many cases, these data require some level of manual record review to assure data quality and completeness.</p>
      <p>Similarly, if a study reports a deidentification procedure, it must describe the details of said procedure. The goals of the deidentification process determine the nature of the deidentification process and the associated regulatory requirements. For example, US hospitals can meet HIPAA (Health Insurance Portability and Accountability Act) standards [<xref ref-type="bibr" rid="ref14">14</xref>] if they require obfuscation of the counts of patients with rare clinical presentations below a specified prevalence threshold and if they employ date shifting. Knowledge of these methods is essential to analyzing and interpreting the derived data.</p>
      <p>Some data types are represented theoretically in the EHR but in practice are only recorded occasionally. For example, standardized codes for smoking history or a family history of specific diseases exist but their underuse is well known. Thus, one cannot assume that the lack of smoking history codes equates to the patient being a nonsmoker. In such scenarios, one must provide an explicit description of the management of missing/null values. Many data elements, such as a complete pulmonary function test, exist in a fragmented form, scattered across different fields in the EHR, and are difficult to extract reliably. In addition, clinical notes allow clinicians greater qualitative expressivity on some of the above values, like smoking history, where they are documented more frequently but not consistently. The quality criteria for reporting narrative content from clinical notes are further addressed below.</p>
      <p>Many clinical states are not represented explicitly in the EHR but can be inferred (often referred to as computational phenotypes). When a publication refers to hyperlipidemia, readers should ask themselves whether the hyperlipidemic phenotype is assessed from one or more lipid laboratory tests, billing diagnostic codes, prescription of lipid-lowering medication, or a combination of the above. It is important to document if only structured codes were used or if the phenotype was defined based on information extracted from clinical notes by using natural language processing (NLP) or manual chart review. Either a table describing these phenotypic methods or a reference to a public set of definitions (eg, Phenotype Knowledgebase, PheKB [<xref ref-type="bibr" rid="ref15">15</xref>]) or a published algorithm with reported accuracy (as seen, for example, in Zhang et al [<xref ref-type="bibr" rid="ref16">16</xref>] and Ananthakrishnan et al [<xref ref-type="bibr" rid="ref17">17</xref>]) can provide transparency and precision to these EHR-driven computational phenotypes. The lack of this transparency should be a warning sign. If onset time or temporal trends of clinical events are used as outcomes, it is important to provide sufficient details on how the data were used to derive these outcomes, how granular time was incorporated (eg, by day, 24-hour period, or hour/minute), and to comment on their accuracy, since EHR data are particularly noisy with regard to capturing the timing of events [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>].</p>
      <p>If one uses EHR data to obtain population estimates (eg, prevalence of a complication per 100,000 patients), then additional information should be provided so that readers can determine which subset of patients from that population a given hospital’s EHR can capture. For example, if the EHR captures a patient’s hospitalization for heart failure, will the EHR also capture the preceding or subsequent outpatient clinic visits related to that hospitalization? With health maintenance organizations, such as Kaiser Permanente, that is much less of a concern, but many hospitals operate in a patchwork system where the patient’s data are spread across multiple heterogeneous EHRs that do not necessarily communicate. In our recent COVID-19 study [<xref ref-type="bibr" rid="ref20">20</xref>], we found many instances in which patients with COVID-19 were transferred from another hospital; unless that other hospital was part of our consortium, it was impossible to have a complete record of their COVID-19 clinical course. It is also important to recognize that a given EHR may not fully capture the clinical course of certain patients, such as those infected with SARS-CoV-2 who have mild symptoms and are discharged home from the emergency room. In these instances, integration of EHR data with data from other sources (eg, primary care providers’ offices or nursing homes) may increase the reliability of analysis, although in practice this is rare and such integration methods have to be well documented. EHR systems may also fail to capture acute events that occur outside of the system, especially in the coded data. Leveraging NLP data from the clinical notes can potentially recover partial information if the patient has follow-up visits within that particular system.</p>
    </sec>
    <sec>
      <title>Data Collection and Handling</title>
      <p>Often the units of measurement and the codes used for data elements like laboratory tests, medications, and diagnoses are not the same across hospitals and may even differ within the same health care system or change over time. Single analytic concepts (eg, the troponin T test) can balloon into dozens of local codes at each hospital, since these tests may be performed at different diagnostic laboratories, each with its own distinct codes or with different technologies over time. Therefore, they have to be “harmonized,” or mapped, to agreed-upon standard terminologies and scales [<xref ref-type="bibr" rid="ref21">21</xref>]. Even when they are the same, their meaning can differ based on population or practice differences (eg, which sensitive troponin test is used or which reference range defines a test result being normal, or in children rather than in adults, whose normative values often change across the age range) [<xref ref-type="bibr" rid="ref7">7</xref>]. In both instances, readers should expect that the specific procedures for harmonization or site-specific semantic alignment are described adequately in the Methods section (or via supplementary materials). A summary of this process can become increasingly complex within the usual confines of a Methods section for multisite and international studies where, by necessity, the site-by-site variability is high.</p>
    </sec>
    <sec>
      <title>Data Type</title>
      <p>There are large methodological divides and divergent ethical challenges between codified data (eg, discrete laboratory values such as serum glucose) and narrative text (eg, discharge summary) from which characterizations are obtained using NLP. While both data types have their own limitations, methods that incorporate both can greatly improve the sensitivity and/or specificity of the clinical characterizations and phenotyping of a group of patients. For example, signs and symptoms are often not codified discretely or consistently (eg, not entered into the EHR’s Problem List) but are written in the clinical notes. Similarly, outpatient medication documentation in clinical notes does not necessarily represent accurately the medications that the patient is actually taking, but prescriptions entered into the EHR may. Combining both codified and NLP data can substantially improve sensitivity and/or specificity and ideally one should always use this complementarity [<xref ref-type="bibr" rid="ref22">22</xref>-<xref ref-type="bibr" rid="ref24">24</xref>]. For example, only about 10% of pregnant women with suicidal ideation have related codes and the vast majority of the cases are only documented in the notes [<xref ref-type="bibr" rid="ref25">25</xref>]. However, the ability to extract NLP data and the accuracy of those data may be limited by each institution’s informatics infrastructure and expertise as well as local institutional review board (IRB) constraints. Furthermore, NLP application to clinical narrative text is relatively new and more prone to large variability in the quality of the obtained characterizations. Particularly in countries with different languages, the NLP techniques and their performance may vary widely. For this reason, readers should expect a reference to the specific NLP methods used and their performance characteristics on data of the sort that the study collected and analyzed. 
For example, if someone describes the use of an NLP approach on discharge summaries in intensive care units in Italy, but the provided citation was validated only for use in outpatient notes written in English, readers can be legitimately concerned about the accuracy and validity of the patient characterizations in that study. Furthermore, if a study claims very high accuracy, readers should expect a report (or citation of a report) that shows an expert review of the NLP method validated against a representative sample confirming the claimed performance.</p>
    </sec>
    <sec>
      <title>Robustness Against EHR Variability</title>
      <p>Beyond any variation in human biology across countries and continents, different styles of practice, and how different reimbursement schemes influence styles of practice and use of EHRs, have a very large impact on the nature of EHR data. Therefore, a multinational study should at least acknowledge these differences as a limitation or explicitly attempt to account for them in the analyses. For example, in COVID-19–related research, it has become increasingly apparent that there is an association between patient race/ethnicity and their risk for acquisition of and complications from COVID-19. However, this association is much less detectable in EHR data, as, for example, it is mostly invisible in data from Europe because several countries forbid collecting self-reported race in the EHR. Even in the United States, the coding of different ethnicities or multiracial identification is not standardized. In addition, some countries have far more comprehensive primary care EHR data sharing, whereas others (like the United States) cannot aggregate data systematically and consistently across major health care centers.</p>
    </sec>
    <sec>
      <title>Transparency</title>
      <p>In order to ensure patients’ rights to privacy, patient-level data can rarely be shared outside an institution. In many EHR-driven studies, the code to extract data from a source EHR can be protected by confidentiality agreements with the EHR vendor and is thus difficult to share. Nonetheless, the code or algorithm for creating the variables used for analyses should be provided even if the detailed data extraction procedures are not shared because of commercial restrictions. Running the code on synthetic data sets that follow a standard data model can demonstrate code functionality and facilitate code reuse [<xref ref-type="bibr" rid="ref26">26</xref>]. The code used to conduct statistical analyses and create visualizations—after data extraction—should also be shared in public repositories to enable other researchers to follow each step of the analysis and provide further transparency. While there are significant challenges to sharing patient-level data, one can share intermediate results and aggregate distributions to increase transparency and understand between-institution differences [<xref ref-type="bibr" rid="ref27">27</xref>]. One should archive the data used for analyses, along with the associated data extraction codes, at the local institution to ensure reproducibility. Authors should also make the deidentified data available—either publicly in a repository or by request. While only a small fraction of readers typically look at the code, whether referenced on a file server or shared as supplementary methods, the availability of the code provides reassurance and validation that the study utilized proper methodologies.</p>
    </sec>
    <sec>
      <title>Multidisciplinary Approach</title>
      <p>There may come a time when data can be aggregated automatically from multiple EHR environments to answer a particular question without relying on a human to understand the particular idiosyncrasies of each institution’s data and EHR system. Until that day, effective EHR data set analysis requires collaboration with clinicians and scientists who have knowledge of the diseases being studied and the practices of their particular health care systems; informaticians with experience in the underlying structures of biomedical record repositories at their own institutions and the characteristics of their data; data harmonization experts to help with data transformation, standardization, integration, and computability; statisticians and epidemiologists well versed in the limitations and opportunities of EHR data sets and related sources of potential bias; machine learning experts; and at least one expert in regulatory and ethical standards. Data provenance records should already exist to ensure compliance with privacy standards, so that authors can readily point to these processes and reference institutional officials who grant data access similarly to IRBs. In our experience, we often have an interdisciplinary team participate in the process of establishing the research question and study design, defining the data elements, and determining what analyses can be performed given the available data. It is also important that people with complementary skills work together to review and interpret the results [<xref ref-type="bibr" rid="ref28">28</xref>]. Each of these steps is a major contribution deserving of authorship. Just as a population genetics study reporting across countries often has dozens of authors, so do we expect multihospital EHR-driven studies to acknowledge and name the individuals as authors and in doing so provide accountability for the dozens of procedures, checks, and balances necessary for the reliable extraction of EHR patient data. 
Consequently, contribution statements should list explicitly the responsibilities of each author with regard to study conceptualization and design, data extraction, data harmonization, data integration, data analysis, results interpretation, and regulatory and ethical oversight. Additionally, although reputation is sometimes overvalued, having <italic>no</italic> reputation, or lacking at least a track record of appropriate success, should trigger greater attention to documenting the process to reach the same level of trust. Unlike a mathematical proof, simple inspection of the data may be insufficient and will become increasingly so in the era of data generated by machine learning algorithms purposefully built for the task of conditioning data to appear real. Trust and accountability become essential companions to transparency and clarity during the EHR analytic process.</p>
    </sec>
    <sec>
      <title>Conclusion</title>
      <p>Similar to publications from the early days of the genomic revolution, which initially included extensive sections on DNA sequencing validation, methods, reagents, and conditions that became progressively briefer as trust was built and the methods commoditized, comprehensively and transparently reported methods of EHR data extraction and transformation are at least as important as subsequent statistical analysis and interpretation. We need to be open and transparent about the inherent limitations of the data and the analyses. We should also acknowledge alternative interpretations of the results (eg, outlier prescribing practices in one country that confound the apparent effects of that drug in that country). Extra caution is also needed in how we draw causal inferences from EHR data, especially given the noisiness and incompleteness of the data in addition to several sources of bias, though application of a causal model framework and specific causal inference methods may help mitigate some of these concerns. The recommendations we have outlined here (see <xref ref-type="table" rid="table1">Table 1</xref> for our 12-item checklist) do not substitute for a durable research infrastructure that would enable tracking EHR data provenance along explicit source, ownership, and data protocols, which would allow for rigorous and routine quality assurance in the use of EHR data [<xref ref-type="bibr" rid="ref29">29</xref>].</p>
      <table-wrap position="float" id="table1">
        <label>Table 1</label>
        <caption>
          <p>12-item checklist to assess electronic health record (EHR) data–driven studies.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="230"/>
          <col width="410"/>
          <col width="360"/>
          <thead>
            <tr valign="top">
              <td>Item</td>
              <td>Reassuring</td>
              <td>Concerning</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>Defining study cohort/data extraction</td>
              <td>Reporting the precise definition of the domains and/or subsets of EHR data extracted for the study cohort and the information system sources</td>
              <td>100% of the EHR said to be extracted or no specification of which subsets of the EHR data were obtained</td>
            </tr>
            <tr valign="top">
              <td>Deidentification</td>
              <td>Specific deidentification algorithm documented with acknowledgment of analytic consequences/limitations</td>
              <td>Only a statement that deidentification was performed</td>
            </tr>
            <tr valign="top">
              <td>Defining clinical variables/data type–specific omissions/limitations</td>
              <td>For data types represented poorly in EHR codified data, either NLP<sup>a</sup> is deployed on the EHR clinical notes or additional data sources (eg, self-reported questionnaires) are used. Procedures to deal with missing values should also be made explicit</td>
              <td>Referencing data types like family/social history without explaining how they are obtained through NLP or exceptional codified data practice</td>
            </tr>
            <tr valign="top">
              <td>Phenotypic transparency</td>
              <td>Computational phenotypes that are more than just a specific native EHR variable (eg, hyperlipidemia vs a specific LDL<sup>b</sup> measurement) are either defined in the study or a citation is given to algorithmic phenotype definitions</td>
              <td>Clinical phenotypes are used in the study without specifying how they were derived from the EHR data</td>
            </tr>
            <tr valign="top">
              <td>Generalizing EHR findings to the population/population denominator</td>
              <td>Study heavily cautions on using prevalence/incidence estimates from the EHR data or refers to empirical estimates on how much of a patient’s entire health care is captured in that particular EHR</td>
              <td>Direct estimates of prevalence or incidence from EHR frequencies without justifying that generalization</td>
            </tr>
            <tr valign="top">
              <td>Data collection</td>
              <td>Clinical forms or data models implemented in health care information systems are shared or clearly described. This includes the coding systems used</td>
              <td>Mention of structured data without specifying the clinical forms or data models. Mention of coded data without mentioning coding systems</td>
            </tr>
            <tr valign="top">
              <td>Data transformation/harmonization</td>
              <td>Data transformation process shared or clear description of which methods were used to harmonize data to a standardized terminology, scale units, and account for different local usage</td>
              <td>Mention of harmonization methods without specifying which ones and what problems were identified and addressed/overcome</td>
            </tr>
            <tr valign="top">
              <td>Textual vs codified data</td>
              <td>If textual data are used in the study, then specification of which clinical notes, in what language, with which NLP algorithm with either an explanation of or a citation to that algorithm’s validation, sensitivity, and specificity for comparable data</td>
              <td>Harmonization efforts for codified and textual data treated as if they are the same process. Lack of specificity in describing the NLP algorithm and performance</td>
            </tr>
            <tr valign="top">
              <td>Manual coding of data</td>
              <td>Qualifications of coders described, formal coding criteria described or at least mentioned, intercoder reliability measured and reported</td>
              <td>No description of process for turning text or nonstandard coded data into standard coded data; use of crowd-sourced coders (eg, graduate students or Mechanical Turk) without mention of quality assurance processes</td>
            </tr>
            <tr valign="top">
              <td>Regional and global variation</td>
              <td>A study describes how they adjust for (or exclude) differences that are due to variation in practice, regulation, and clinical documentation through the EHR from site to site</td>
              <td>A study says it adjusted for regional or country differences in practice or EHR documentation but does not describe how this was done</td>
            </tr>
            <tr valign="top">
              <td>Sharing analytic code</td>
              <td>Analytic code is deposited in a public repository or study-specific public website</td>
              <td>Code is not shared or only “shared on demand”</td>
            </tr>
            <tr valign="top">
              <td>Acknowledge a multidisciplinary team</td>
              <td>Authorships for all parts of the extraction-through-analysis pipeline with precision as to each contribution</td>
              <td>Health care system sources not named or local health care system site collaborators not named</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table1fn1">
            <p><sup>a</sup>NLP: natural language processing.</p>
          </fn>
          <fn id="table1fn2">
            <p><sup>b</sup>LDL: low-density lipoprotein.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
      <p>Finally, in crises such as the COVID-19 pandemic, we need to recognize that many studies can contribute to our understanding of what is happening to our patients and how our practices might affect patient outcomes. Overly generalized conclusions will likely strain the boundaries of what can be reasonably inferred from the kinds of data currently obtained through EHRs. Recommendations that flow from overly broad claims may irreversibly harm stakeholders, including patients and clinicians. Increased reader awareness of EHR-derived data quality indicators is crucial to critically appraising EHR-driven studies and to preventing harm from misleading studies, which will ensure sustainable quality in this rapidly growing field.</p>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">4CE</term>
          <def>
            <p>Consortium for Clinical Characterization of COVID-19 by EHR</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">EHR</term>
          <def>
            <p>electronic health record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">HIPAA</term>
          <def>
            <p>Health Insurance Portability and Accountability Act</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">RECORD</term>
          <def>
            <p>Reporting of Studies Conducted Using Observational Routinely Collected Health Data</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">IRB</term>
          <def>
            <p>institutional review board</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">PheKB</term>
          <def>
            <p>Phenotype Knowledgebase</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>The members of the Consortium for Clinical Characterization of COVID-19 By EHR (4CE) are as follows: Adem Albayrak, Danilo F Amendola, Li LLJ Anthony, Bruce J Aronow, Andrew Atz, Paul Avillach, Brett K Beaulieu-Jones, Douglas S Bell, Antonio Bellasi, Riccardo Bellazzi, Vincent Benoit, Michele Beraghi, José Luis Bernal Sobrino, Mélodie Bernaux, Romain Bey, Alvar Blanco Martínez, Martin Boeker, Clara-Lea Bonzel, John Booth, Silvano Bosari, Florence T Bourgeois, Robert L Bradford, Gabriel A Brat, Stéphane Bréant, Mauro Bucalo, Anita Burgun, Tianxi Cai, Mario Cannataro, Aize Cao, Charlotte Caucheteux, Julien Champ, Luca Chiovato, James J Cimino, Tiago K Colicchio, Sylvie Cormont, Sébastien Cossin, Jean Craig, Juan Luis Cruz Bermúdez, Arianna Dagliati, Mohamad Daniar, Christel Daniel, Anahita Davoudi, Batsal Devkota, Julien Dubiel, Scott L DuVall, Loic Esteve, Shirley Fan, Robert W Follett, Paula SA Gaiolla, Thomas Ganslandt, Noelia García Barrio, Nils Gehlenborg, Alon Geva, Tobias Gradinger, Alexandre Gramfort, Romain Griffier, Nicolas Griffon, Olivier Grisel, Alba Gutiérrez-Sacristán, David A Hanauer, Christian Haverkamp, Martin Hilka, John H Holmes, Chuan Hong, Petar Horki, Meghan R Hutch, Richard Issitt, Anne Sophie Jannot, Vianney Jouhet, Mark S Keller, Katie Kirchoff, Jeffrey G Klann, Isaac S Kohane, Ian D Krantz, Detlef Kraska, Ashok K Krishnamurthy, Sehi L’Yi, Trang T Le, Judith Leblanc, Guillaume Lemaitre, Leslie Lenert, Damien Leprovost, Molei Liu, Ne Hooi Will Loh, Yuan Luo, Kristine E Lynch, Sadiqa Mahmood, Sarah Maidlow, Alberto Malovini, Kenneth D Mandl, Chengsheng Mao, Patricia Martel, Aaron J Masino, Michael E Matheny, Thomas Maulhardt, Michael T McDuffie, Arthur Mensch, Marcos F Minicucci, Bertrand Moal, Jason H Moore, Jeffrey S Morris, Michele Morris, Karyn L Moshal, Sajad Mousavi, Danielle L Mowery, Douglas A Murad, Shawn N Murphy, Kee Yuan Ngiam, Jihad Obeid, Marina P Okoshi, Karen L Olson, Gilbert S Omenn, Nina Orlova, Brian D Ostasiewski, 
Nathan P Palmer, Nicolas Paris, Lav P Patel, Miguel Pedrera Jimenez, Hans U Prokosch, Robson A Prudente, Rachel B Ramoni, Maryna Raskin, Siegbert Rieg, Gustavo Roig Domínguez, Elisa Salamanca, Malarkodi J Samayamuthu, Arnaud Sandrin, Emily Schiver, Juergen Schuettler, Luigia Scudeller, Neil Sebire, Pablo Serrano Balazote, Patricia Serre, Arnaud Serret-Larmande, Domenick Silvio, Piotr Sliz, Jiyeon Son, Andrew M South, Anastasia Spiridou, Amelia LM Tan, Bryce WQ Tan, Byorn WL Tan, Suzana E Tanni, Deanne M Taylor, Valentina Tibollo, Patric Tippmann, Andrew K Vallejos, Gael Varoquaux, Jill-Jênn Vie, Shyam Visweswaran, Kavishwar B Wagholikar, Lemuel R Waitman, Demian Wassermann, Griffin M Weber, Yuan William, Zongqi Xia, Alberto Zambelli, Aldo Carmona, Charles Sonday, and James Balshi.</p>
    </ack>
    <fn-group>
      <fn fn-type="con">
        <p>ISK led the 4CE international consortium, conceived and designed the study, and drafted the manuscript. TC led 4CE analytics strategies and made contributions to the study design and drafting of the manuscript. JJC contributed a validation strategy and made edits to the manuscript. NG-B was responsible for data extraction and transformation to 4CE format and quality control of the results and made internal contributions. NG led 4CE visualization strategies and made contributions/edits to the manuscript. JGK contributed to the 4CE validation strategy and data submission strategies and made edits to the manuscript. KDM made contributions to the text and framework and made edits to the manuscript. DM was involved in data extraction and transformation to 4CE format. SNM led 4CE data validation strategies and made contributions/edits to the manuscript. GSO made contributions to strategy and edits to the manuscript. NP contributed to 4CE data analysis, aggregation, and quality control. KBW contributed to validation strategies and made edits to the manuscript. BJA, PA, BKB-J, RB, RLB, GAB, MC, MG, AG-S, DAH, JHH, CH, NHW, YL, JHM, AN, KYN, LPP, MP-J, PS, AMS, ALMT, DMT, BMT, CT, AKV, and GMW made contributions/edits to the manuscript.</p>
      </fn>
      <fn fn-type="conflict">
        <p>RB and AM are shareholders of Biomeris srl. GSO is affiliated with BoD, Galectin Therapeutics, Angion Biomedica, and Amesite, Inc. DMT consulted on a legal matter for AstraZeneca last year.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mehra</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Desai</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Ruschitzka</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>AN</given-names>
            </name>
          </person-group>
          <article-title>RETRACTED: Hydroxychloroquine or chloroquine with or without a macrolide for treatment of COVID-19: a multinational registry analysis</article-title>
          <source>The Lancet</source>
          <year>2020</year>
          <month>5</month>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1016/S0140-6736(20)31180-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S0140-6736(20)31180-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mehra</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Desai</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Kuy</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Henry</surname>
              <given-names>TD</given-names>
            </name>
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>AN</given-names>
            </name>
          </person-group>
          <article-title>Cardiovascular Disease, Drug Therapy, and Mortality in Covid-19</article-title>
          <source>N Engl J Med</source>
          <year>2020</year>
          <month>06</month>
          <day>18</day>
          <volume>382</volume>
          <issue>25</issue>
          <fpage>e102</fpage>
          <pub-id pub-id-type="doi">10.1056/nejmoa2007621</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cox</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Donnelly</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <source>Principles of Applied Statistics</source>
          <year>2011</year>
          <publisher-loc>Cambridge, UK</publisher-loc>
          <publisher-name>Cambridge University Press</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Eriksson</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Byrne</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Johansson</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Trygg</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Vikström</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <source>Multi- and Megavariate Data Analysis: Basic Principles and Applications</source>
          <year>2013</year>
          <publisher-loc>Malmö, Sweden</publisher-loc>
          <publisher-name>Umetrics Academy</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Benchimol</surname>
              <given-names>EI</given-names>
            </name>
            <name name-style="western">
              <surname>Smeeth</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Guttmann</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Harron</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Moher</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Petersen</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Sørensen</surname>
              <given-names>HT</given-names>
            </name>
            <name name-style="western">
              <surname>von Elm</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Langan</surname>
              <given-names>SM</given-names>
            </name>
            <collab>RECORD Working Committee</collab>
          </person-group>
          <article-title>The REporting of studies Conducted using Observational Routinely-collected health Data (RECORD) statement</article-title>
          <source>PLoS Med</source>
          <year>2015</year>
          <month>10</month>
          <day>6</day>
          <volume>12</volume>
          <issue>10</issue>
          <fpage>e1001885</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pmed.1001885"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pmed.1001885</pub-id>
          <pub-id pub-id-type="medline">26440803</pub-id>
          <pub-id pub-id-type="pii">PMEDICINE-D-15-00711</pub-id>
          <pub-id pub-id-type="pmcid">PMC4595218</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Langan</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Schmidt</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Wing</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Ehrenstein</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Nicholls</surname>
              <given-names>SG</given-names>
            </name>
            <name name-style="western">
              <surname>Filion</surname>
              <given-names>KB</given-names>
            </name>
            <name name-style="western">
              <surname>Klungel</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Petersen</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Sørensen</surname>
              <given-names>HT</given-names>
            </name>
            <name name-style="western">
              <surname>Dixon</surname>
              <given-names>WG</given-names>
            </name>
            <name name-style="western">
              <surname>Guttmann</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Harron</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Hemkens</surname>
              <given-names>LG</given-names>
            </name>
            <name name-style="western">
              <surname>Moher</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Schneeweiss</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Smeeth</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Sturkenboom</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>von Elm</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>SV</given-names>
            </name>
            <name name-style="western">
              <surname>Benchimol</surname>
              <given-names>EI</given-names>
            </name>
          </person-group>
          <article-title>The reporting of studies conducted using observational routinely collected health data statement for pharmacoepidemiology (RECORD-PE)</article-title>
          <source>BMJ</source>
          <year>2018</year>
          <month>11</month>
          <day>14</day>
          <volume>363</volume>
          <fpage>k3532</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.bmj.com/lookup/pmidlookup?view=long&amp;pmid=30429167"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmj.k3532</pub-id>
          <pub-id pub-id-type="medline">30429167</pub-id>
          <pub-id pub-id-type="pmcid">PMC6234471</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hersh</surname>
              <given-names>WR</given-names>
            </name>
            <name name-style="western">
              <surname>Weiner</surname>
              <given-names>MG</given-names>
            </name>
            <name name-style="western">
              <surname>Embi</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Logan</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Payne</surname>
              <given-names>PR</given-names>
            </name>
            <name name-style="western">
              <surname>Bernstam</surname>
              <given-names>EV</given-names>
            </name>
            <name name-style="western">
              <surname>Lehmann</surname>
              <given-names>HP</given-names>
            </name>
            <name name-style="western">
              <surname>Hripcsak</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Hartzog</surname>
              <given-names>TH</given-names>
            </name>
            <name name-style="western">
              <surname>Cimino</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Saltz</surname>
              <given-names>JH</given-names>
            </name>
          </person-group>
          <article-title>Caveats for the Use of Operational Electronic Health Record Data in Comparative Effectiveness Research</article-title>
          <source>Medical Care</source>
          <year>2013</year>
          <volume>51</volume>
          <fpage>S30</fpage>
          <lpage>S37</lpage>
          <pub-id pub-id-type="doi">10.1097/mlr.0b013e31829b1dbd</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Verheij</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Curcin</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Delaney</surname>
              <given-names>BC</given-names>
            </name>
            <name name-style="western">
              <surname>McGilchrist</surname>
              <given-names>MM</given-names>
            </name>
          </person-group>
          <article-title>Possible Sources of Bias in Primary Care Electronic Health Record Data Use and Reuse</article-title>
          <source>J Med Internet Res</source>
          <year>2018</year>
          <month>05</month>
          <day>29</day>
          <volume>20</volume>
          <issue>5</issue>
          <fpage>e185</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2018/5/e185/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.9134</pub-id>
          <pub-id pub-id-type="medline">29844010</pub-id>
          <pub-id pub-id-type="pii">v20i5e185</pub-id>
          <pub-id pub-id-type="pmcid">PMC5997930</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kahn</surname>
              <given-names>MG</given-names>
            </name>
            <name name-style="western">
              <surname>Callahan</surname>
              <given-names>TJ</given-names>
            </name>
            <name name-style="western">
              <surname>Barnard</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bauck</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Brown</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Davidson</surname>
              <given-names>BN</given-names>
            </name>
            <name name-style="western">
              <surname>Estiri</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Goerg</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Holve</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>SG</given-names>
            </name>
            <name name-style="western">
              <surname>Liaw</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hamilton-Lopez</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Meeker</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ong</surname>
              <given-names>TC</given-names>
            </name>
            <name name-style="western">
              <surname>Ryan</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Shang</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Weiskopf</surname>
              <given-names>NG</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zozus</surname>
              <given-names>MN</given-names>
            </name>
            <name name-style="western">
              <surname>Schilling</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>A Harmonized Data Quality Assessment Terminology and Framework for the Secondary Use of Electronic Health Record Data</article-title>
          <source>EGEMS (Wash DC)</source>
          <year>2016</year>
          <month>09</month>
          <day>11</day>
          <volume>4</volume>
          <issue>1</issue>
          <fpage>1244</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27713905"/>
          </comment>
          <pub-id pub-id-type="doi">10.13063/2327-9214.1244</pub-id>
          <pub-id pub-id-type="medline">27713905</pub-id>
          <pub-id pub-id-type="pii">egems1244</pub-id>
          <pub-id pub-id-type="pmcid">PMC5051581</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Weiskopf</surname>
              <given-names>NG</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Methods and dimensions of electronic health record data quality assessment: enabling reuse for clinical research</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2013</year>
          <month>01</month>
          <day>01</day>
          <volume>20</volume>
          <issue>1</issue>
          <fpage>144</fpage>
          <lpage>151</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/22733976"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/amiajnl-2011-000681</pub-id>
          <pub-id pub-id-type="medline">22733976</pub-id>
          <pub-id pub-id-type="pii">amiajnl-2011-000681</pub-id>
          <pub-id pub-id-type="pmcid">PMC3555312</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Casey</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Schwartz</surname>
              <given-names>BS</given-names>
            </name>
            <name name-style="western">
              <surname>Stewart</surname>
              <given-names>WF</given-names>
            </name>
            <name name-style="western">
              <surname>Adler</surname>
              <given-names>NE</given-names>
            </name>
          </person-group>
          <article-title>Using Electronic Health Records for Population Health Research: A Review of Methods and Applications</article-title>
          <source>Annu Rev Public Health</source>
          <year>2016</year>
          <month>03</month>
          <day>18</day>
          <volume>37</volume>
          <issue>1</issue>
          <fpage>61</fpage>
          <lpage>81</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/26667605"/>
          </comment>
          <pub-id pub-id-type="doi">10.1146/annurev-publhealth-032315-021353</pub-id>
          <pub-id pub-id-type="medline">26667605</pub-id>
          <pub-id pub-id-type="pmcid">PMC6724703</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Capocaccia</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>De Angelis</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Estimating the completeness of prevalence based on cancer registry data</article-title>
          <source>Statist Med</source>
          <year>1997</year>
          <month>02</month>
          <day>28</day>
          <volume>16</volume>
          <issue>4</issue>
          <fpage>425</fpage>
          <lpage>440</lpage>
          <pub-id pub-id-type="doi">10.1002/(sici)1097-0258(19970228)16:4&lt;425::aid-sim414&gt;3.0.co;2-z</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Smirnov</surname>
              <given-names>VB</given-names>
            </name>
          </person-group>
          <article-title>Earthquake catalogs: Evaluation of data completeness</article-title>
          <source>Volc Seis</source>
          <year>1998</year>
          <volume>19</volume>
          <fpage>497</fpage>
          <lpage>510</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.researchgate.net/publication/288555243_Earthquake_catalogs_Evaluation_of_data_completeness"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="web">
          <article-title>Methods for De-identification of PHI</article-title>
          <source>Office for Civil Rights</source>
          <year>2015</year>
          <month>11</month>
          <day>6</day>
          <access-date>2020-06-16</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.hhs.gov/hipaa/for-professionals/privacy/special-topics/de-identification/index.html">https://www.hhs.gov/hipaa/for-professionals/privacy/special-topics/de-identification/index.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kirby</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Speltz</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Rasmussen</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Basford</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gottesman</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Peissig</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Pacheco</surname>
              <given-names>Jennifer A</given-names>
            </name>
            <name name-style="western">
              <surname>Tromp</surname>
              <given-names>Gerard</given-names>
            </name>
            <name name-style="western">
              <surname>Pathak</surname>
              <given-names>Jyotishman</given-names>
            </name>
            <name name-style="western">
              <surname>Carrell</surname>
              <given-names>David S</given-names>
            </name>
            <name name-style="western">
              <surname>Ellis</surname>
              <given-names>Stephen B</given-names>
            </name>
            <name name-style="western">
              <surname>Lingren</surname>
              <given-names>Todd</given-names>
            </name>
            <name name-style="western">
              <surname>Thompson</surname>
              <given-names>Will K</given-names>
            </name>
            <name name-style="western">
              <surname>Savova</surname>
              <given-names>Guergana</given-names>
            </name>
            <name name-style="western">
              <surname>Haines</surname>
              <given-names>Jonathan</given-names>
            </name>
            <name name-style="western">
              <surname>Roden</surname>
              <given-names>Dan M</given-names>
            </name>
            <name name-style="western">
              <surname>Harris</surname>
              <given-names>Paul A</given-names>
            </name>
            <name name-style="western">
              <surname>Denny</surname>
              <given-names>Joshua C</given-names>
            </name>
          </person-group>
          <article-title>PheKB: a catalog and workflow for creating electronic phenotype algorithms for transportability</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2016</year>
          <month>11</month>
          <volume>23</volume>
          <issue>6</issue>
          <fpage>1046</fpage>
          <lpage>1052</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27026615"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocv202</pub-id>
          <pub-id pub-id-type="medline">27026615</pub-id>
          <pub-id pub-id-type="pii">ocv202</pub-id>
          <pub-id pub-id-type="pmcid">PMC5070514</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Can</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lai</surname>
              <given-names>PMR</given-names>
            </name>
            <name name-style="western">
              <surname>Mukundan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Castro</surname>
              <given-names>VM</given-names>
            </name>
            <name name-style="western">
              <surname>Dligach</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Finan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Gainer</surname>
              <given-names>VS</given-names>
            </name>
            <name name-style="western">
              <surname>Shadick</surname>
              <given-names>NA</given-names>
            </name>
            <name name-style="western">
              <surname>Savova</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Murphy</surname>
              <given-names>SN</given-names>
            </name>
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Weiss</surname>
              <given-names>ST</given-names>
            </name>
            <name name-style="western">
              <surname>Du</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Age and morphology of posterior communicating artery aneurysms</article-title>
          <source>Sci Rep</source>
          <year>2020</year>
          <month>07</month>
          <day>14</day>
          <volume>10</volume>
          <issue>1</issue>
          <fpage>11545</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-020-68276-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-020-68276-9</pub-id>
          <pub-id pub-id-type="medline">32665589</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-020-68276-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC7360743</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ananthakrishnan</surname>
              <given-names>AN</given-names>
            </name>
            <name name-style="western">
              <surname>Cagan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Gainer</surname>
              <given-names>VS</given-names>
            </name>
            <name name-style="western">
              <surname>Shaw</surname>
              <given-names>SY</given-names>
            </name>
            <name name-style="western">
              <surname>Churchill</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Karlson</surname>
              <given-names>EW</given-names>
            </name>
            <name name-style="western">
              <surname>Murphy</surname>
              <given-names>SN</given-names>
            </name>
            <name name-style="western">
              <surname>Liao</surname>
              <given-names>KP</given-names>
            </name>
            <name name-style="western">
              <surname>Kohane</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Statin Use Is Associated With Reduced Risk of Colorectal Cancer in Patients With Inflammatory Bowel Diseases</article-title>
          <source>Clin Gastroenterol Hepatol</source>
          <year>2016</year>
          <month>07</month>
          <volume>14</volume>
          <issue>7</issue>
          <fpage>973</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/26905907"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.cgh.2016.02.017</pub-id>
          <pub-id pub-id-type="medline">26905907</pub-id>
          <pub-id pub-id-type="pii">S1542-3565(16)00165-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC4912917</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Uno</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Ritzwoller</surname>
              <given-names>DP</given-names>
            </name>
            <name name-style="western">
              <surname>Cronin</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Carroll</surname>
              <given-names>NM</given-names>
            </name>
            <name name-style="western">
              <surname>Hornbrook</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>Hassett</surname>
              <given-names>MJ</given-names>
            </name>
          </person-group>
          <article-title>Determining the Time of Cancer Recurrence Using Claims or Electronic Medical Record Data</article-title>
          <source>JCO Clinical Cancer Informatics</source>
          <year>2018</year>
          <month>12</month>
          <volume>2</volume>
          <fpage>1</fpage>
          <lpage>10</lpage>
          <pub-id pub-id-type="doi">10.1200/cci.17.00163</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Xiong</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Temporal Phenotyping from Longitudinal Electronic Health Records: A Graph Based Framework</article-title>
          <year>2015</year>
          <conf-name>KDD '15: Proceedings of the 21th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</conf-name>
          <conf-date>August 2015</conf-date>
          <conf-loc>Sydney, NSW, Australia</conf-loc>
          <publisher-loc>New York, NY</publisher-loc>
          <publisher-name>Association for Computing Machinery</publisher-name>
          <fpage>705</fpage>
          <lpage>714</lpage>
          <pub-id pub-id-type="doi">10.1145/2783258.2783352</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Brat</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Weber</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Gehlenborg</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Avillach</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Palmer</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Chiovato</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Cimino</surname>
              <given-names>James</given-names>
            </name>
            <name name-style="western">
              <surname>Waitman</surname>
              <given-names>Lemuel R</given-names>
            </name>
            <name name-style="western">
              <surname>Omenn</surname>
              <given-names>Gilbert S</given-names>
            </name>
            <name name-style="western">
              <surname>Malovini</surname>
              <given-names>Alberto</given-names>
            </name>
            <name name-style="western">
              <surname>Moore</surname>
              <given-names>Jason H</given-names>
            </name>
            <name name-style="western">
              <surname>Beaulieu-Jones</surname>
              <given-names>Brett K</given-names>
            </name>
            <name name-style="western">
              <surname>Tibollo</surname>
              <given-names>Valentina</given-names>
            </name>
            <name name-style="western">
              <surname>Murphy</surname>
              <given-names>Shawn N</given-names>
            </name>
            <name name-style="western">
              <surname>L'Yi</surname>
              <given-names>Sehi</given-names>
            </name>
            <name name-style="western">
              <surname>Keller</surname>
              <given-names>Mark S</given-names>
            </name>
            <name name-style="western">
              <surname>Bellazzi</surname>
              <given-names>Riccardo</given-names>
            </name>
            <name name-style="western">
              <surname>Hanauer</surname>
              <given-names>David A</given-names>
            </name>
            <name name-style="western">
              <surname>Serret-Larmande</surname>
              <given-names>Arnaud</given-names>
            </name>
            <name name-style="western">
              <surname>Gutierrez-Sacristan</surname>
              <given-names>Alba</given-names>
            </name>
            <name name-style="western">
              <surname>Holmes</surname>
              <given-names>John J</given-names>
            </name>
            <name name-style="western">
              <surname>Bell</surname>
              <given-names>Douglas S</given-names>
            </name>
            <name name-style="western">
              <surname>Mandl</surname>
              <given-names>Kenneth D</given-names>
            </name>
            <name name-style="western">
              <surname>Follett</surname>
              <given-names>Robert W</given-names>
            </name>
            <name name-style="western">
              <surname>Klann</surname>
              <given-names>Jeffrey G</given-names>
            </name>
            <name name-style="western">
              <surname>Murad</surname>
              <given-names>Douglas A</given-names>
            </name>
            <name name-style="western">
              <surname>Scudeller</surname>
              <given-names>Luigia</given-names>
            </name>
            <name name-style="western">
              <surname>Bucalo</surname>
              <given-names>Mauro</given-names>
            </name>
            <name name-style="western">
              <surname>Kirchoff</surname>
              <given-names>Katie</given-names>
            </name>
            <name name-style="western">
              <surname>Craig</surname>
              <given-names>Jean</given-names>
            </name>
            <name name-style="western">
              <surname>Obeid</surname>
              <given-names>Jihad</given-names>
            </name>
            <name name-style="western">
              <surname>Jouhet</surname>
              <given-names>Vianney</given-names>
            </name>
            <name name-style="western">
              <surname>Griffier</surname>
              <given-names>Romain</given-names>
            </name>
            <name name-style="western">
              <surname>Cossin</surname>
              <given-names>Sebastien</given-names>
            </name>
            <name name-style="western">
              <surname>Moal</surname>
              <given-names>Bertrand</given-names>
            </name>
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>Lav P</given-names>
            </name>
            <name name-style="western">
              <surname>Bellasi</surname>
              <given-names>Antonio</given-names>
            </name>
            <name name-style="western">
              <surname>Prokosch</surname>
              <given-names>Hans U</given-names>
            </name>
            <name name-style="western">
              <surname>Kraska</surname>
              <given-names>Detlef</given-names>
            </name>
            <name name-style="western">
              <surname>Sliz</surname>
              <given-names>Piotr</given-names>
            </name>
            <name name-style="western">
              <surname>Tan</surname>
              <given-names>Amelia L M</given-names>
            </name>
            <name name-style="western">
              <surname>Ngiam</surname>
              <given-names>Kee Yuan</given-names>
            </name>
            <name name-style="western">
              <surname>Zambelli</surname>
              <given-names>Alberto</given-names>
            </name>
            <name name-style="western">
              <surname>Mowery</surname>
              <given-names>Danielle L</given-names>
            </name>
            <name name-style="western">
              <surname>Schiver</surname>
              <given-names>Emily</given-names>
            </name>
            <name name-style="western">
              <surname>Devkota</surname>
              <given-names>Batsal</given-names>
            </name>
            <name name-style="western">
              <surname>Bradford</surname>
              <given-names>Robert L</given-names>
            </name>
            <name name-style="western">
              <surname>Daniar</surname>
              <given-names>Mohamad</given-names>
            </name>
            <name name-style="western">
              <surname>Daniel</surname>
              <given-names>Christel</given-names>
            </name>
            <name name-style="western">
              <surname>Benoit</surname>
              <given-names>Vincent</given-names>
            </name>
            <name name-style="western">
              <surname>Bey</surname>
              <given-names>Romain</given-names>
            </name>
            <name name-style="western">
              <surname>Paris</surname>
              <given-names>Nicolas</given-names>
            </name>
            <name name-style="western">
              <surname>Serre</surname>
              <given-names>Patricia</given-names>
            </name>
            <name name-style="western">
              <surname>Orlova</surname>
              <given-names>Nina</given-names>
            </name>
            <name name-style="western">
              <surname>Dubiel</surname>
              <given-names>Julien</given-names>
            </name>
            <name name-style="western">
              <surname>Hilka</surname>
              <given-names>Martin</given-names>
            </name>
            <name name-style="western">
              <surname>Jannot</surname>
              <given-names>Anne Sophie</given-names>
            </name>
            <name name-style="western">
              <surname>Breant</surname>
              <given-names>Stephane</given-names>
            </name>
            <name name-style="western">
              <surname>Leblanc</surname>
              <given-names>Judith</given-names>
            </name>
            <name name-style="western">
              <surname>Griffon</surname>
              <given-names>Nicolas</given-names>
            </name>
            <name name-style="western">
              <surname>Burgun</surname>
              <given-names>Anita</given-names>
            </name>
            <name name-style="western">
              <surname>Bernaux</surname>
              <given-names>Melodie</given-names>
            </name>
            <name name-style="western">
              <surname>Sandrin</surname>
              <given-names>Arnaud</given-names>
            </name>
            <name name-style="western">
              <surname>Salamanca</surname>
              <given-names>Elisa</given-names>
            </name>
            <name name-style="western">
              <surname>Cormont</surname>
              <given-names>Sylvie</given-names>
            </name>
            <name name-style="western">
              <surname>Ganslandt</surname>
              <given-names>Thomas</given-names>
            </name>
            <name name-style="western">
              <surname>Gradinger</surname>
              <given-names>Tobias</given-names>
            </name>
            <name name-style="western">
              <surname>Champ</surname>
              <given-names>Julien</given-names>
            </name>
            <name name-style="western">
              <surname>Boeker</surname>
              <given-names>Martin</given-names>
            </name>
            <name name-style="western">
              <surname>Martel</surname>
              <given-names>Patricia</given-names>
            </name>
            <name name-style="western">
              <surname>Esteve</surname>
              <given-names>Loic</given-names>
            </name>
            <name name-style="western">
              <surname>Gramfort</surname>
              <given-names>Alexandre</given-names>
            </name>
            <name name-style="western">
              <surname>Grisel</surname>
              <given-names>Olivier</given-names>
            </name>
            <name name-style="western">
              <surname>Leprovost</surname>
              <given-names>Damien</given-names>
            </name>
            <name name-style="western">
              <surname>Moreau</surname>
              <given-names>Thomas</given-names>
            </name>
            <name name-style="western">
              <surname>Varoquaux</surname>
              <given-names>Gael</given-names>
            </name>
            <name name-style="western">
              <surname>Vie</surname>
              <given-names>Jill-Jênn</given-names>
            </name>
            <name name-style="western">
              <surname>Wassermann</surname>
              <given-names>Demian</given-names>
            </name>
            <name name-style="western">
              <surname>Mensch</surname>
              <given-names>Arthur</given-names>
            </name>
            <name name-style="western">
              <surname>Caucheteux</surname>
              <given-names>Charlotte</given-names>
            </name>
            <name name-style="western">
              <surname>Haverkamp</surname>
              <given-names>Christian</given-names>
            </name>
            <name name-style="western">
              <surname>Lemaitre</surname>
              <given-names>Guillaume</given-names>
            </name>
            <name name-style="western">
              <surname>Bosari</surname>
              <given-names>Silvano</given-names>
            </name>
            <name name-style="western">
              <surname>Krantz</surname>
              <given-names>Ian D</given-names>
            </name>
            <name name-style="western">
              <surname>South</surname>
              <given-names>Andrew</given-names>
            </name>
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>Tianxi</given-names>
            </name>
            <name name-style="western">
              <surname>Kohane</surname>
              <given-names>Isaac S</given-names>
            </name>
          </person-group>
          <article-title>International electronic health record-derived COVID-19 clinical course profiles: the 4CE consortium</article-title>
          <source>NPJ Digit Med</source>
          <year>2020</year>
          <volume>3</volume>
          <fpage>109</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41746-020-00308-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41746-020-00308-0</pub-id>
          <pub-id pub-id-type="medline">32864472</pub-id>
          <pub-id pub-id-type="pii">308</pub-id>
          <pub-id pub-id-type="pmcid">PMC7438496</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Klann</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Abend</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Raghavan</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Mandl</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Murphy</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Data interchange using i2b2</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2016</year>
          <month>09</month>
          <volume>23</volume>
          <issue>5</issue>
          <fpage>909</fpage>
          <lpage>15</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/26911824"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocv188</pub-id>
          <pub-id pub-id-type="medline">26911824</pub-id>
          <pub-id pub-id-type="pii">ocv188</pub-id>
          <pub-id pub-id-type="pmcid">PMC4997035</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ananthakrishnan</surname>
              <given-names>AN</given-names>
            </name>
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Savova</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Perez</surname>
              <given-names>RG</given-names>
            </name>
            <name name-style="western">
              <surname>Gainer</surname>
              <given-names>VS</given-names>
            </name>
            <name name-style="western">
              <surname>Murphy</surname>
              <given-names>SN</given-names>
            </name>
            <name name-style="western">
              <surname>Szolovits</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Xia</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Shaw</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Churchill</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Karlson</surname>
              <given-names>EW</given-names>
            </name>
            <name name-style="western">
              <surname>Kohane</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Plenge</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Liao</surname>
              <given-names>KP</given-names>
            </name>
          </person-group>
          <article-title>Improving Case Definition of Crohn's Disease and Ulcerative Colitis in Electronic Medical Records Using Natural Language Processing</article-title>
          <source>Inflammatory Bowel Diseases</source>
          <year>2013</year>
          <volume>19</volume>
          <issue>7</issue>
          <fpage>1411</fpage>
          <lpage>1420</lpage>
          <pub-id pub-id-type="doi">10.1097/mib.0b013e31828133fd</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ning</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Chan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Beam</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Geva</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Liao</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Mullen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Mandl</surname>
              <given-names>KD</given-names>
            </name>
            <name name-style="western">
              <surname>Kohane</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Feature extraction for phenotyping from semantic and knowledge resources</article-title>
          <source>J Biomed Inform</source>
          <year>2019</year>
          <month>03</month>
          <volume>91</volume>
          <fpage>103122</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(19)30040-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2019.103122</pub-id>
          <pub-id pub-id-type="medline">30738949</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(19)30040-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC6424621</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Cho</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ho</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Ananthakrishnan</surname>
              <given-names>AN</given-names>
            </name>
            <name name-style="western">
              <surname>Xia</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Shaw</surname>
              <given-names>SY</given-names>
            </name>
            <name name-style="western">
              <surname>Gainer</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Castro</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Link</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Honerlaw</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Gagnon</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Karlson</surname>
              <given-names>EW</given-names>
            </name>
            <name name-style="western">
              <surname>Plenge</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Szolovits</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Savova</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Churchill</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>O'Donnell</surname>
              <given-names>Christopher</given-names>
            </name>
            <name name-style="western">
              <surname>Murphy</surname>
              <given-names>SN</given-names>
            </name>
            <name name-style="western">
              <surname>Gaziano</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Kohane</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Liao</surname>
              <given-names>KP</given-names>
            </name>
          </person-group>
          <article-title>High-throughput phenotyping with electronic medical record data using a common semi-supervised approach (PheCAP)</article-title>
          <source>Nat Protoc</source>
          <year>2019</year>
          <month>12</month>
          <day>20</day>
          <volume>14</volume>
          <issue>12</issue>
          <fpage>3426</fpage>
          <lpage>3444</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31748751"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41596-019-0227-6</pub-id>
          <pub-id pub-id-type="medline">31748751</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41596-019-0227-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC7323894</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhong</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Karlson</surname>
              <given-names>EW</given-names>
            </name>
            <name name-style="western">
              <surname>Gelaye</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Finan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Avillach</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Smoller</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>MA</given-names>
            </name>
          </person-group>
          <article-title>Screening pregnant women for suicidal behavior in electronic medical records: diagnostic codes vs. clinical notes processed by natural language processing</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2018</year>
          <month>05</month>
          <day>29</day>
          <volume>18</volume>
          <issue>1</issue>
          <fpage>30</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-018-0617-7"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-018-0617-7</pub-id>
          <pub-id pub-id-type="medline">29843698</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-018-0617-7</pub-id>
          <pub-id pub-id-type="pmcid">PMC5975502</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Morin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Urban</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Adams</surname>
              <given-names>PD</given-names>
            </name>
            <name name-style="western">
              <surname>Foster</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Sali</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Baker</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Sliz</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Research priorities. Shining light into black boxes</article-title>
          <source>Science</source>
          <year>2012</year>
          <month>04</month>
          <day>13</day>
          <volume>336</volume>
          <issue>6078</issue>
          <fpage>159</fpage>
          <lpage>160</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/22499926"/>
          </comment>
          <pub-id pub-id-type="doi">10.1126/science.1218263</pub-id>
          <pub-id pub-id-type="medline">22499926</pub-id>
          <pub-id pub-id-type="pii">336/6078/159</pub-id>
          <pub-id pub-id-type="pmcid">PMC4203337</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Beaulieu-Jones</surname>
              <given-names>BK</given-names>
            </name>
            <name name-style="western">
              <surname>Greene</surname>
              <given-names>CS</given-names>
            </name>
          </person-group>
          <article-title>Reproducibility of computational workflows is automated using continuous analysis</article-title>
          <source>Nat Biotechnol</source>
          <year>2017</year>
          <month>04</month>
          <day>13</day>
          <volume>35</volume>
          <issue>4</issue>
          <fpage>342</fpage>
          <lpage>346</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/28288103"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/nbt.3780</pub-id>
          <pub-id pub-id-type="medline">28288103</pub-id>
          <pub-id pub-id-type="pii">nbt.3780</pub-id>
          <pub-id pub-id-type="pmcid">PMC6103790</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liao</surname>
              <given-names>KP</given-names>
            </name>
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Savova</surname>
              <given-names>GK</given-names>
            </name>
            <name name-style="western">
              <surname>Murphy</surname>
              <given-names>SN</given-names>
            </name>
            <name name-style="western">
              <surname>Karlson</surname>
              <given-names>EW</given-names>
            </name>
            <name name-style="western">
              <surname>Ananthakrishnan</surname>
              <given-names>AN</given-names>
            </name>
            <name name-style="western">
              <surname>Gainer</surname>
              <given-names>VS</given-names>
            </name>
            <name name-style="western">
              <surname>Shaw</surname>
              <given-names>SY</given-names>
            </name>
            <name name-style="western">
              <surname>Xia</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Szolovits</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Churchill</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kohane</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Development of phenotype algorithms using electronic medical records and incorporating natural language processing</article-title>
          <source>BMJ</source>
          <year>2015</year>
          <month>04</month>
          <day>24</day>
          <volume>350</volume>
          <issue>apr24 11</issue>
          <fpage>h1885</fpage>
          <lpage>h1885</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25911572"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmj.h1885</pub-id>
          <pub-id pub-id-type="medline">25911572</pub-id>
          <pub-id pub-id-type="pmcid">PMC4707569</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Geissbuhler</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Safran</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Buchan</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Bellazzi</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Labkoff</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Eilenberg</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Leese</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Richardson</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Mantas</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Murray</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>De Moor</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Trustworthy reuse of health data: a transnational perspective</article-title>
          <source>Int J Med Inform</source>
          <year>2013</year>
          <month>01</month>
          <volume>82</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2012.11.003</pub-id>
          <pub-id pub-id-type="medline">23182430</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(12)00202-X</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
