<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v25i1e43153</article-id>
      <article-id pub-id-type="pmid">37093636</article-id>
      <article-id pub-id-type="doi">10.2196/43153</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Natural Language Processing in a Clinical Decision Support System for the Identification of Venous Thromboembolism: Algorithm Development and Validation</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Leung</surname>
            <given-names>Tiffany</given-names>
          </name>
        </contrib>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Baker</surname>
            <given-names>Jannah</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Han</surname>
            <given-names>Peijin</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Jin</surname>
            <given-names>Zhi-Geng</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2971-6697</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>Hui</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1942-2513</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Tai</surname>
            <given-names>Mei-Hui</given-names>
          </name>
          <degrees>MM</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0909-6040</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>Ying</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1197-6941</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Yao</surname>
            <given-names>Yuan</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9426-4415</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Guo</surname>
            <given-names>Yu-Tao</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Department of Pulmonary Vascular and Thrombotic Disease</institution>
            <institution>Sixth Medical Center of Chinese People's Liberation Army General Hospital</institution>
            <addr-line>No. 6 Fucheng Road</addr-line>
            <addr-line>Haidian District</addr-line>
            <addr-line>Beijing, 100048</addr-line>
            <country>China</country>
            <phone>86 01066958581</phone>
            <email>dor_guoyt@hotmail.com</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7626-7751</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Department of Pulmonary Vascular and Thrombotic Disease</institution>
        <institution>Sixth Medical Center of Chinese People's Liberation Army General Hospital</institution>
        <addr-line>Beijing</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Chinese People's Liberation Army Medical School</institution>
        <addr-line>Beijing</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Quality Management Division</institution>
        <institution>Sixth Medical Center of Chinese People's Liberation Army General Hospital</institution>
        <addr-line>Beijing</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Institute for Hospital Management Research</institution>
        <institution>Chinese People's Liberation Army General Hospital</institution>
        <addr-line>Beijing</addr-line>
        <country>China</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Yu-Tao Guo <email>dor_guoyt@hotmail.com</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2023</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>24</day>
        <month>4</month>
        <year>2023</year>
      </pub-date>
      <volume>25</volume>
      <elocation-id>e43153</elocation-id>
      <history>
        <date date-type="received">
          <day>1</day>
          <month>10</month>
          <year>2022</year>
        </date>
        <date date-type="rev-request">
          <day>4</day>
          <month>11</month>
          <year>2022</year>
        </date>
        <date date-type="rev-recd">
          <day>20</day>
          <month>11</month>
          <year>2022</year>
        </date>
        <date date-type="accepted">
          <day>29</day>
          <month>3</month>
          <year>2023</year>
        </date>
      </history>
      <copyright-statement>©Zhi-Geng Jin, Hui Zhang, Mei-Hui Tai, Ying Yang, Yuan Yao, Yu-Tao Guo. Originally published in the Journal of Medical Internet Research (https://www.jmir.org), 24.04.2023.</copyright-statement>
      <copyright-year>2023</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on https://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2023/1/e43153" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>It remains unknown whether capturing data from electronic health records (EHRs) using natural language processing (NLP) can improve venous thromboembolism (VTE) detection in different clinical settings.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>The aim of this study was to validate the NLP algorithm in a clinical decision support system for VTE risk assessment and integrated care (DeVTEcare) to identify VTEs from EHRs.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>All inpatients aged ≥18 years in the Sixth Medical Center of the Chinese People's Liberation Army General Hospital from January 1 to December 31, 2021, were included as the validation cohort. The sensitivity, specificity, positive and negative likelihood ratios (LR+ and LR–, respectively), area under the receiver operating characteristic curve (AUC), and F1-scores along with their 95% CIs were used to analyze the performance of the NLP tool, with manual review of medical records as the reference standard for detecting deep vein thrombosis (DVT) and pulmonary embolism (PE). The primary end point was the performance of the NLP approach embedded into the EHR for VTE identification. The secondary end points were the performances in identifying VTE among different hospital departments with different VTE risks. Subgroup analyses were performed by age, sex, and study season.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Among 30,152 patients (median age 56 [IQR 41-67] years; 14,247/30,152, 47.3% females), the prevalence of VTE, PE, and DVT was 2.1% (626/30,152), 0.6% (177/30,152), and 1.8% (532/30,152), respectively. The sensitivity, specificity, LR+, LR–, AUC, and F1-score of NLP-facilitated VTE detection were 89.9% (95% CI 87.3%-92.2%), 99.8% (95% CI 99.8%-99.9%), 483 (95% CI 370-629), 0.10 (95% CI 0.08-0.13), 0.95 (95% CI 0.94-0.96), and 0.90 (95% CI 0.90-0.91), respectively. Among departments of surgery, internal medicine, and intensive care units, the highest specificity (100% vs 99.7% vs 98.8%, respectively), LR+ (3202 vs 321 vs 77, respectively), and F1-score (0.95 vs 0.89 vs 0.92, respectively) were in the surgery department (all <italic>P</italic>&#60;.001). Among low, intermediate, and high VTE risks in hospital departments, the low-risk department had the highest AUC (1.00 vs 0.94 vs 0.96, respectively) and F1-score (0.97 vs 0.90 vs 0.90, respectively) as well as the lowest LR– (0.00 vs 0.13 vs 0.08, respectively) (DeLong test for AUC; all <italic>P</italic>&#60;.001). Subgroup analysis of the age, sex, and season demonstrated consistently good performance of VTE detection with &#62;87% sensitivity and specificity and &#62;89% AUC and F1-score. The NLP algorithm performed better among patients aged ≤65 years than among those aged &#62;65 years (F1-score 0.93 vs 0.89, respectively; <italic>P</italic>&#60;.001).</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>The NLP algorithm in our DeVTEcare identified VTE well across different clinical settings, especially in patients in surgery units, departments with low-risk VTE, and patients aged ≤65 years. This algorithm can help to inform accurate in-hospital VTE rates and enhance risk-classified VTE integrated care in future research.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>venous thromboembolism</kwd>
        <kwd>deep vein thrombosis</kwd>
        <kwd>pulmonary embolism</kwd>
        <kwd>natural language processing</kwd>
        <kwd>electronic health record</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Venous thromboembolism (VTE), which includes deep vein thrombosis (DVT) and pulmonary embolism (PE), is a leading cause of death and disability worldwide [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. Studies have shown that the prevalence of VTE has substantially increased worldwide [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref4">4</xref>]. Up to 60% of VTE cases occur during or after hospitalization, making it a leading preventable cause of hospital death [<xref ref-type="bibr" rid="ref5">5</xref>]. The detection of VTE among hospitalized patients informs decision-making surrounding VTE risk and thrombosis risk mitigation. However, doctors and nurses may not be aware of the risk of VTE, which in turn leads to lack of adherence with the clinical practice guidelines for patients with VTE, given the complex clinical setting [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>]. To ensure that best practices are reliably delivered, some quality and safety indicators for VTE prevention and management have been adopted as measures of hospital performance and are utilized in several pay-for-performance programs [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref9">9</xref>]. Thus, accurate and timely identification of VTE from hospital clinical and administrative databases is crucial for assessing hospital care quality and for further enhancing improvements in care.</p>
      <p>Although manual medical record review is the gold standard for VTE event investigation, it is a time-consuming, labor-intensive, and costly process. The International Classification of Diseases diagnosis codes are commonly used to monitor VTE incidence at each hospital, but they are unreliable for establishing ground truth since they are prone to coding bias and have variable reported accuracy in identifying VTE [<xref ref-type="bibr" rid="ref10">10</xref>-<xref ref-type="bibr" rid="ref12">12</xref>]. Moreover, they are only available after discharge. The growing use of electronic health records (EHRs) has made it possible for health care providers to acquire an invaluable source of information for research and analysis. Recently, the natural language processing (NLP) method has been developed for embedding into EHRs to flag adverse outcomes [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>]. These technologies, which use corpus processing and automatic learning models from extracted EHR data, hold promise for reliably and efficiently identifying patients with VTE [<xref ref-type="bibr" rid="ref15">15</xref>].</p>
      <p>Previous studies on the application of NLP tools for detecting VTE cases mainly utilized imaging reports, and the reported positive predictive values (PPVs) ranged from 54% to 100% [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref16">16</xref>-<xref ref-type="bibr" rid="ref24">24</xref>]. Nonetheless, besides imaging, more available data, including clinical text, laboratory values, and vital signs in EHRs, can be utilized for NLP to improve VTE detection. In addition, VTE prophylaxis is hospital-level management, and NLP-facilitated VTE detection should adapt to different clinical settings and help clinicians pay attention to VTE in the early stage.</p>
      <p>In this study, we describe an NLP algorithm in a clinical decision support system for VTE risk assessment and integrated care (DeVTEcare) that can recognize DVT and PE in a timely manner from different types of EHR data after their occurrence, and we validate its performance in VTE detection in different clinical settings.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Study Design and Population</title>
        <p>This retrospective observational study was conducted in the Sixth Medical Center of the Chinese People's Liberation Army General Hospital, which is a tertiary hospital that integrates medical care, teaching, and research. All inpatients aged ≥18 years admitted between January 1 and December 31, 2021, were included as the validation cohort. Hospitalized patients were excluded if they lacked diagnostic information or if their hospital stay was ≤24 hours. This study followed the Standards for Reporting Diagnostic accuracy studies (STARD) reporting guidelines (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>) [<xref ref-type="bibr" rid="ref25">25</xref>].</p>
      </sec>
      <sec>
        <title>Ethics Approval</title>
        <p>This cohort study was approved by the medical ethics committee of the Sixth Medical Center of Chinese People's Liberation Army General Hospital (approval HZKY-PJ-2022-21). A waiver of informed consent was obtained because this was a retrospective data-only study. All data were deidentified.</p>
      </sec>
      <sec>
        <title>NLP Approach Development</title>
        <p>The rule-based NLP approach in DeVTEcare was embedded into the EHR to identify VTE in a timely manner based on the clinical text (admission notes, medical progress notes, surgical notes, discharge summaries, etc) and imaging reports. When a patient was admitted, DeVTEcare automatically assessed and flagged VTE risk, and then, the guideline-recommended VTE prophylaxis and treatments were further proposed at 5 time points: within 24 hours after admission, within 24 hours before and after operation, within 24 hours after transfer, and at discharge. Moreover, VTE risk was automatically assessed daily at midnight.</p>
        <p>The NLP system detected VTE in 3 steps: data acquisition, information extraction, and information aggregation (<xref rid="figure1" ref-type="fig">Figure 1</xref>). This system employs a set of highly optimized and configurable NLP components that enable quick and easy clinical information extraction and aggregation (<xref ref-type="table" rid="table1">Table 1</xref>). All relevant full-text documents from patients were retrieved from the EHR. First, the data acquisition module encapsulated patient data into the JSON format. Second, in the information extraction process, the location of extraction was determined by the location detector. The information for the discharge confirmation of patients with VTE was extracted from the patient’s imaging report, discharge summaries, medical progress notes, and surgical notes, while the information for the admission confirmation of patients with VTE was extracted from the patient’s admission notes. Then, the sentence segmenter was used to break up the sentence, the entity recognizer was used to identify the target concept, and the context detector was used to find the target concept’s occurrence time and negation relationship. Next, the sentence inferencer was used to derive the sentence conclusion, and the document inferencer was then utilized to generate the document conclusion. Third, in the information aggregation process, the convergence of various documented findings yielded “discharged with VTE” and “admission with VTE,” which were then further computed by expressions to yield the results for new-onset in-hospital VTE.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>The natural language processing tool inferencing workflow in the clinical decision support system for venous thromboembolism risk assessment and integrated care. EHR: electronic health record; VTE: venous thromboembolism.</p>
          </caption>
          <graphic xlink:href="jmir_v25i1e43153_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Components of the natural language processing tool in the clinical decision support system for venous thromboembolism risk assessment and integrated care.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="190"/>
            <col width="810"/>
            <thead>
              <tr valign="top">
                <td>Components</td>
                <td>Functionality description</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Location detector</td>
                <td>Identify information extraction locations such as present medical history, admission notes, medical progress notes, surgical notes, discharge summaries, and imaging reports</td>
              </tr>
              <tr valign="top">
                <td>Sentence segmenter</td>
                <td>Detect sentence boundaries</td>
              </tr>
              <tr valign="top">
                <td>Entity recognizer<sup>a</sup></td>
                <td>Identify target concepts such as deep vein thrombosis or pulmonary embolism</td>
              </tr>
              <tr valign="top">
                <td>Context detector</td>
                <td>Attach the context information as feature values to the corresponding target concepts such as present or historical, negated or affirmed</td>
              </tr>
              <tr valign="top">
                <td>Sentence inferencer</td>
                <td>Create sentence-level conclusions based on target concepts and corresponding context</td>
              </tr>
              <tr valign="top">
                <td>Document inferencer</td>
                <td>Create a document-level conclusion from the corresponding sentence-level conclusions</td>
              </tr>
              <tr valign="top">
                <td>Patient inferencer<sup>b</sup></td>
                <td>Aggregate document-level conclusions to infer patient-level conclusions</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>As an extension, the entity recognizer can not only extract named entities from free text but also extract variables from structured data.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>For the patient inferencer part, we have expanded the syntax expression function to support arithmetic, logic, and set operations.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>To achieve these objectives, a VTE domain knowledge base was developed. We used disease definitions from the Chinese Guidelines for the Prevention and Treatment of Thrombophilia [<xref ref-type="bibr" rid="ref26">26</xref>], the National Clinical Version of Disease Classification and Coding 2.0 [<xref ref-type="bibr" rid="ref27">27</xref>], and the corresponding Chinese translations from the Unified Medical Language System from the National Library of Medicine. We also searched medical websites for corresponding synonyms to enrich the ontology concepts [<xref ref-type="bibr" rid="ref28">28</xref>]. The knowledge base was further improved by a research team involving 2 NLP programmers, 3 medical specialists in thrombosis, and 2 database administrators with a weekly working meeting. During the iterative training phase, a small proportion of real clinical cases was manually verified by the designated physicians on a weekly basis, the NLP programmer iteratively refined the rules to correct recognition errors for 8 weeks, and eventually, 200 randomly selected patients were tested. During the testing phase, an additional 260 patients were randomly selected for testing by the physicians. After the test was complete, the NLP approach achieved 85.7% sensitivity and 93.5% specificity for detecting VTE. Then, the NLP programmer repeatedly refined the rules based on the test results and research team’s comments until all correctable faults were fixed. The keywords for the NLP algorithm are listed in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>.</p>
      </sec>
      <sec>
        <title>Validation of the NLP Approach</title>
        <p>The NLP approach for VTE detection was validated in different clinical settings and in departments with different VTE risk statuses, as follows.</p>
        <list list-type="order">
          <list-item>
            <p>We stratified 43 inpatient departments in our hospital into surgery, internal medicine, and intensive care units.</p>
          </list-item>
          <list-item>
            <p>The number of VTE-related deaths was calculated between the years of 2011 and 2020.</p>
          </list-item>
        </list>
        <p>The departments were further classified as low, intermediate, and high risks for VTE if there were &#60;1, 1-5, or &#62;5 VTE-related deaths per year, respectively. The performance of the NLP approach was also evaluated with regard to the type of VTE, that is, PE or DVT. Manual review of medical records was taken as the reference standard for detecting PE and DVT. When there was a disagreement between NLP identification and the clinical expert’s review, an advanced artificial intelligence engineer and a cardiologist audited the event.</p>
      </sec>
      <sec>
        <title>Study End Points</title>
        <p>The primary end point was the performance of the NLP approach in DeVTEcare embedded into the EHR for VTE identification. The secondary end points were the performances to identify VTE in different clinical settings and in departments with different VTE risk statuses.</p>
      </sec>
      <sec>
        <title>Clinical Events</title>
        <p>The diagnosis of VTE was confirmed on Doppler ultrasound, computed tomography, or computed tomography pulmonary angiogram. The VTEs were classified as (1) on-admission VTE: new-onset VTE present on admission to the hospital and (2) in-hospital VTE: new-onset VTE during hospitalization but without VTE on admission. Since this study primarily focused on DVT and PE, thromboses in the upper extremity, internal jugular, and superior or inferior vena cava were not considered valid VTE. Patients with prior VTE were also deemed invalid.</p>
      </sec>
      <sec>
        <title>Statistical Analyses</title>
        <p>Continuous variables were expressed as median (IQR), while categorical variables were expressed as numbers and percentages. The sensitivity, specificity, PPV, negative predictive value (NPV), area under the receiver operating characteristic curve (AUC), and F1-score were used to evaluate the performance of the NLP approach for VTE detection, in relation to the type of VTE, the different clinical settings, and the low-, intermediate-, and high-risk departments. Subgroup analyses were performed by age (&#62;65 years or ≤65 years), sex (female or male), and study season (first quarter, second quarter, third quarter, fourth quarter). Given that PPV might be affected by the prevalence of disease, positive and negative likelihood ratios (LR+ and LR–, respectively) were used to characterize the clinical utility of the test. The LR– CIs were obtained using a bootstrap method with 100% sensitivity [<xref ref-type="bibr" rid="ref29">29</xref>].</p>
        <p>The chi-square test or Fisher exact test was applied for the comparisons of the categorical variables, as appropriate. The DeLong test was used for comparing AUCs, and the <italic>Z</italic> test was used for comparing the F1-scores. The relative diagnostic LR method was used for comparing the LRs of 2 diagnostic tests [<xref ref-type="bibr" rid="ref30">30</xref>]. The Bonferroni method was used to adjust for multiple comparisons. The agreement to the reference test and the interreviewer agreement were also assessed using the Cohen κ test. A 2-sided <italic>P</italic>&#60;.01 was considered to be statistically significant. All statistical analyses were carried out using the R software (version 4.2.1; R Core Team and the R Foundation for Statistical Computing).</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Characteristics of the Patients</title>
        <p>A total of 30,152 patients were included from January 1 to December 31, 2021; the flow chart is shown in <xref rid="figure2" ref-type="fig">Figure 2</xref>. The median patient age was 56 (IQR 41-67) years, and 47.3% (14,247/30,152) of the patients were females. Half of the patients were from internal medicine departments with moderate risk of VTE. The enrolled patients were almost equally distributed throughout the 4 quarters of the study year. The median length of hospital stay was 8 (IQR 5-12) days. The incidence of VTE confirmed by the clinical experts was 2.1% (626/30,152), with PE at 0.6% (177/30,152) and DVT at 1.8% (532/30,152). The detailed incidence of VTE is shown in <xref ref-type="table" rid="table2">Table 2</xref> and <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>. Overall, the prevalence of VTE increased with the increasing VTE risk in the departments (high risk: 219/6769, 3.2%; intermediate risk: 358/15,368, 2.3%; low risk: 49/8015, 0.6%; <italic>P</italic>&#60;.001).</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Flowchart of the patient analysis in this study. The low, intermediate, and high risks of venous thromboembolism were defined by departments having &#60;1, 1-5, and &#62;5 venous thromboembolism–related deaths per year, respectively.</p>
          </caption>
          <graphic xlink:href="jmir_v25i1e43153_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Characteristics of the patients in this study.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="350"/>
            <col width="0"/>
            <col width="250"/>
            <col width="0"/>
            <col width="280"/>
            <col width="0"/>
            <col width="90"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Characteristics</td>
                <td colspan="2">Patients (N=30,152), n (%)</td>
                <td colspan="2">Venous thromboembolism events<sup>a</sup> (n=626), n (%)</td>
                <td><italic>P</italic> value<sup>b</sup></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="7">
                  <bold>Age (years)</bold>
                </td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>&#62;65</td>
                <td colspan="2">8859 (29.4)</td>
                <td colspan="2">409 (4.6)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>≤65</td>
                <td colspan="2">21,293 (70.6)</td>
                <td colspan="2">217 (1)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="7">
                  <bold>Sex</bold>
                </td>
                <td>.43</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Female</td>
                <td colspan="2">14,247 (47.3)</td>
                <td colspan="2">286 (2)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Male</td>
                <td colspan="2">15,905 (52.7)</td>
                <td colspan="2">340 (2.1)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="7">
                  <bold>Department</bold>
                </td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Surgery</td>
                <td colspan="2">13,589 (45.1)</td>
                <td colspan="2">77 (0.6)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Internal medicine</td>
                <td colspan="2">15,681 (52)</td>
                <td colspan="2">421 (2.7)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Intensive care unit</td>
                <td colspan="2">882 (2.9)</td>
                <td colspan="2">128 (14.5)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="7">
                  <bold>Venous thromboembolism risk<sup>c</sup></bold>
                </td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>High</td>
                <td colspan="2">6769 (22.4)</td>
                <td colspan="2">219 (3.2)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Intermediate</td>
                <td colspan="2">15,368 (51)</td>
                <td colspan="2">358 (2.3)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Low</td>
                <td colspan="2">8015 (26.6)</td>
                <td colspan="2">49 (0.6)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="7">
                  <bold>Quarter of the study year</bold>
                </td>
                <td>&#60;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>First quarter</td>
                <td colspan="2">5868 (19.5)</td>
                <td colspan="2">109 (1.9)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Second quarter</td>
                <td colspan="2">7616 (25.2)</td>
                <td colspan="2">128 (1.7)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Third quarter</td>
                <td colspan="2">8510 (28.2)</td>
                <td colspan="2">157 (1.8)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Fourth quarter</td>
                <td colspan="2">8158 (27.1)</td>
                <td colspan="2">232 (2.8)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>Any venous thromboembolism event confirmed by clinical experts.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup><italic>P</italic> values for the comparison of venous thromboembolism events.</p>
            </fn>
            <fn id="table2fn3">
              <p><sup>c</sup>The low, intermediate, and high venous thromboembolism risk was defined by departments having &#60;1, 1-5, and &#62;5 venous thromboembolism–related deaths per year, respectively.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>NLP Performance for VTE Detection</title>
        <p>In DeVTEcare, of the 626 events, 563 (89.9%) VTEs were detected by the NLP approach, achieving a sensitivity of 89.9%, specificity of 99.8%, PPV of 91.1%, NPV of 99.8%, LR+ of 483, LR– of 0.1, AUC of 0.95, and F1-score of 0.9. The NLP approach detected both on-admission and in-hospital VTE, with sensitivity ranging from 84.4% to 100%, specificity from 99.8% to 100%, PPV from 81% to 92.3%, NPV from 99.8% to 100%, LR+ from 550 to 7115, LR– from 0 to 0.16, AUC from 0.92 to 1.00, and F1-score from 0.87 to 0.94 (<xref ref-type="table" rid="table3">Table 3</xref>, <xref ref-type="table" rid="table4">Table 4</xref>, and <xref rid="figure3" ref-type="fig">Figure 3</xref>). However, NLP performed better in detecting PE than DVT for on-admission VTE (sensitivity 100% vs 84.4%, NPV 100% vs 99.8%, LR+ 1579 vs 739, LR– 0 vs 0.16, AUC 1.00 vs 0.92, F1-score 0.94 vs 0.87, respectively; DeLong test for AUC; all <italic>P</italic>&#60;.01), while much higher NPV (100% vs 99.9%, respectively; <italic>P</italic>&#60;.001) and lower F1-score (0.87 vs 0.90, respectively; <italic>P</italic>&#60;.001) were observed for in-hospital PE detection. No statistically significant differences in the other diagnostic parameters between PE and DVT for either on-admission or in-hospital detection were found (all <italic>P</italic>&#62;.01) (<xref ref-type="table" rid="table3">Table 3</xref>, <xref ref-type="table" rid="table4">Table 4</xref>, and <xref rid="figure3" ref-type="fig">Figure 3</xref>). DeVTEcare and the expert’s review agreed well for any type of VTE identification, with κ values ranging from 0.87 to 0.94 (<xref ref-type="table" rid="table4">Table 4</xref>). Interreviewer agreement for the diagnosis of VTE showed κ values of 0.90-1.00.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Likelihood ratios of the clinical decision support system for venous thromboembolism risk assessment and integrated care for identifying venous thromboembolism.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="320"/>
            <col width="0"/>
            <col width="320"/>
            <col width="0"/>
            <col width="330"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Venous thromboembolism type</td>
                <td colspan="2">Positive likelihood ratio (95% CI)</td>
                <td>Negative likelihood ratio (95% CI)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="6">
                  <bold>On-admission venous thromboembolism</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Pulmonary embolism</td>
                <td colspan="2">1579 (1007-2474)<sup>a</sup></td>
                <td colspan="2">0.00 (0.00-0.02)<sup>b</sup></td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Deep vein thrombosis</td>
                <td colspan="2">739 (527-1037)</td>
                <td colspan="2">0.16 (0.12-0.20)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Venous thromboembolism</td>
                <td colspan="2">550 (414-731)</td>
                <td colspan="2">0.11 (0.08-0.14)</td>
              </tr>
              <tr valign="top">
                <td colspan="6">
                  <bold>In-hospital venous thromboembolism</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Pulmonary embolism</td>
                <td colspan="2">7115 (2653-19,077)</td>
                <td colspan="2">0.06 (0.01-0.37)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Deep vein thrombosis</td>
                <td colspan="2">2042 (1183-3526)</td>
                <td colspan="2">0.11 (0.08-0.17)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Venous thromboembolism</td>
                <td colspan="2">1782 (1072-2962)</td>
                <td colspan="2">0.11 (0.07-0.16)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Any venous thromboembolism</td>
                <td colspan="2">483 (370-629)</td>
                <td colspan="2">0.10 (0.08-0.13)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>Pulmonary embolism versus deep vein thrombosis; <italic>P</italic>=.008.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>Pulmonary embolism versus deep vein thrombosis; <italic>P</italic>&#60;.001.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Diagnostic statistics of the clinical decision support system for venous thromboembolism risk assessment and integrated care for identifying venous thromboembolism.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="400"/>
            <col width="0"/>
            <col width="190"/>
            <col width="0"/>
            <col width="190"/>
            <col width="0"/>
            <col width="190"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Venous thromboembolism type</td>
                <td colspan="2">Area under the curve<sup>a</sup> (95% CI)</td>
                <td colspan="2">F1-score<sup>b</sup> (95% CI)</td>
                <td>κ (95% CI)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="8">
                  <bold>On-admission venous thromboembolism</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Pulmonary embolism</td>
                <td colspan="2">1.00 (1.00-1.00)<sup>c</sup></td>
                <td colspan="2">0.94 (0.93-0.95)<sup>c</sup></td>
                <td colspan="2">0.94 (0.92-0.97)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Deep vein thrombosis</td>
                <td colspan="2">0.92 (0.90-0.94)</td>
                <td colspan="2">0.87 (0.86-0.88)</td>
                <td colspan="2">0.87 (0.84-0.90)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Venous thromboembolism</td>
                <td colspan="2">0.94 (0.93-0.96)</td>
                <td colspan="2">0.89 (0.88-0.90)</td>
                <td colspan="2">0.89 (0.87-0.91)</td>
              </tr>
              <tr valign="top">
                <td colspan="8">
                  <bold>In-hospital venous thromboembolism</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Pulmonary embolism</td>
                <td colspan="2">0.97 (0.92-1.00)</td>
                <td colspan="2">0.87 (0.83-0.91)</td>
                <td colspan="2">0.87 (0.76-0.98)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Deep vein thrombosis</td>
                <td colspan="2">0.94 (0.92-0.97)</td>
                <td colspan="2">0.90 (0.89-0.92)<sup>c</sup></td>
                <td colspan="2">0.90 (0.87-0.94)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Venous thromboembolism</td>
                <td colspan="2">0.95 (0.92-0.97)</td>
                <td colspan="2">0.90 (0.89-0.91)</td>
                <td colspan="2">0.90 (0.87-0.93)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Any venous thromboembolism</td>
                <td colspan="2">0.95 (0.94-0.96)</td>
                <td colspan="2">0.90 (0.90-0.91)</td>
                <td colspan="2">0.90 (0.89-0.92)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup>DeLong test was used for comparing areas under the curve.</p>
            </fn>
            <fn id="table4fn2">
              <p><sup>b</sup><italic>Z</italic> test was used for comparing F1-scores.</p>
            </fn>
            <fn id="table4fn3">
              <p><sup>c</sup>Pulmonary embolism versus deep vein thrombosis; <italic>P</italic>&#60;.001.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Performance of the clinical decision support system for venous thromboembolism risk assessment and integrated care for identifying venous thromboembolism. (A) Sensitivity and specificity. (B) Positive and negative predictive values. DVT: deep vein thrombosis; FN: false negative; FP: false positive; NPV: negative predictive value; PE: pulmonary embolism; PPV: positive predictive value; TN: true negative; TP: true positive; VTE: venous thromboembolism.</p>
          </caption>
          <graphic xlink:href="jmir_v25i1e43153_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>NLP Performance in Different Settings and VTE Risk</title>
        <p>Among the departments of surgery, internal medicine, and intensive care units, the highest specificity (100% vs 99.7% vs 98.8%, respectively), NPV (100% vs 99.7% vs 98.7%, respectively), LR+ (3202 vs 321 vs 77, respectively), and F1-score (0.95 vs 0.89 vs 0.92, respectively) of the NLP approach for VTE detection were in the surgery department (all <italic>P</italic>&#60;.001; Bonferroni adjusted <italic>P</italic>=.003). No statistically significant differences were found in sensitivity, PPV, LR–, and AUC (all <italic>P</italic>&#62;.01; Bonferroni adjusted <italic>P</italic>=.003) (<xref ref-type="table" rid="table5">Table 5</xref>, <xref ref-type="table" rid="table6">Table 6</xref>, and <xref rid="figure4" ref-type="fig">Figure 4</xref>).</p>
        <p>The NLP algorithm consistently detected VTE in low-, intermediate-, and high-risk departments with good sensitivity and specificity (sensitivity 100%, 87.4%, and 91.8%, respectively; specificity 100%, 99.8%, and 99.6%, respectively), although the difference in specificity between low- and high-risk departments was statistically significant (<italic>P</italic>&#60;.001; Bonferroni adjusted <italic>P</italic>=.003). Among low-, intermediate-, and high-risk departments, the low-risk department had the highest AUC (1.00 vs 0.94 vs 0.96, respectively), F1-score (0.97 vs 0.90 vs 0.90, respectively), NPV (100% vs 99.7% vs 99.7%, respectively), and the lowest LR– (0.00 vs 0.13 vs 0.08, respectively) (DeLong test for AUC, all <italic>P</italic>&#60;.001; Bonferroni adjusted <italic>P</italic>=.003). The highest LR+ was associated with the low-risk department as well (2655 vs 525 vs 223, respectively), but a statistically significant difference existed only between the low- and high-risk departments (<italic>P</italic>&#60;.001; Bonferroni adjusted <italic>P</italic>=.003) (<xref ref-type="table" rid="table5">Table 5</xref>, <xref ref-type="table" rid="table6">Table 6</xref>, and <xref rid="figure4" ref-type="fig">Figure 4</xref>). The error analysis of DeVTEcare in detecting VTE is shown in <xref ref-type="table" rid="table7">Table 7</xref>.</p>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Likelihood ratios of the clinical decision support system for venous thromboembolism risk assessment and integrated care for identifying any venous thromboembolism according to different settings.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="380"/>
            <col width="0"/>
            <col width="300"/>
            <col width="0"/>
            <col width="290"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Setting</td>
                <td colspan="2">Positive likelihood ratio (95% CI)</td>
                <td>Negative likelihood ratio (95% CI)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="6">
                  <bold>Age (years)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>&#62;65</td>
                <td colspan="2">178 (132-242)</td>
                <td colspan="2">0.11 (0.09-0.15)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>≤65</td>
                <td colspan="2">1494 (866-2576)<sup>a</sup></td>
                <td colspan="2">0.08 (0.05-0.12)</td>
              </tr>
              <tr valign="top">
                <td colspan="6">
                  <bold>Sex</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Female</td>
                <td colspan="2">744 (462-1198)</td>
                <td colspan="2">0.09 (0.07-0.13)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Male</td>
                <td colspan="2">366 (266-504)</td>
                <td colspan="2">0.11 (0.08-0.14)</td>
              </tr>
              <tr valign="top">
                <td colspan="6">
                  <bold>Department</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Surgery</td>
                <td colspan="2">3202 (1200-8543)<sup>b</sup></td>
                <td colspan="2">0.05 (0.02-0.13)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Internal medicine</td>
                <td colspan="2">321 (237-435)</td>
                <td colspan="2">0.12 (0.09-0.15)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Intensive care unit</td>
                <td colspan="2">77 (40-148)</td>
                <td colspan="2">0.08 (0.04-0.14)</td>
              </tr>
              <tr valign="top">
                <td colspan="6">
                  <bold>Venous thromboembolism risk by department<sup>c</sup></bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>High</td>
                <td colspan="2">223 (152-325)</td>
                <td colspan="2">0.08 (0.05-0.13)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Intermediate</td>
                <td colspan="2">525 (354-778)</td>
                <td colspan="2">0.13 (0.10-0.16)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Low</td>
                <td colspan="2">2655 (856-8231)<sup>d</sup></td>
                <td colspan="2">0.00 (0.00-0.06)</td>
              </tr>
              <tr valign="top">
                <td colspan="6">
                  <bold>Quarter of the study year</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>First quarter</td>
                <td colspan="2">732 (348-1539)</td>
                <td colspan="2">0.11 (0.06-0.19)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Second quarter</td>
                <td colspan="2">834 (416-1671)</td>
                <td colspan="2">0.11 (0.07-0.18)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Third quarter</td>
                <td colspan="2">687 (380-1242)</td>
                <td colspan="2">0.10 (0.06-0.15)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Fourth quarter</td>
                <td colspan="2">247 (171-357)</td>
                <td colspan="2">0.10 (0.06-0.14)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table5fn1">
              <p><sup>a</sup>≤65 years versus &#62;65 years; <italic>P</italic>&#60;.001.</p>
            </fn>
            <fn id="table5fn2">
              <p><sup>b</sup>Surgery versus internal medicine or intensive care unit; <italic>P</italic>&#60;.001; Bonferroni adjusted <italic>P</italic>=.003.</p>
            </fn>
            <fn id="table5fn3">
              <p><sup>c</sup>The low, intermediate, and high risk of venous thromboembolism was defined by departments having &#60;1, 1-5, and &#62;5 venous thromboembolism–related deaths per year, respectively.</p>
            </fn>
            <fn id="table5fn4">
              <p><sup>d</sup>Low versus high; <italic>P</italic>&#60;.001; Bonferroni adjusted <italic>P</italic>=.003.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table6">
          <label>Table 6</label>
          <caption>
            <p>Diagnostic statistics of the clinical decision support system for venous thromboembolism risk assessment and integrated care for identifying any venous thromboembolism according to different settings.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="240"/>
            <col width="0"/>
            <col width="270"/>
            <col width="0"/>
            <col width="230"/>
            <col width="230"/>
            <thead>
              <tr valign="bottom">
                <td colspan="3">Setting</td>
                <td colspan="2">Area under the curve<sup>a</sup> (95% CI)</td>
                <td>F1-score<sup>b</sup> (95% CI)</td>
                <td>κ (95% CI)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="7">
                  <bold>Age (years)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>&#62;65</td>
                <td colspan="2">0.94 (0.93-0.96)</td>
                <td colspan="2">0.89 (0.88-0.90)</td>
                <td>0.92 (0.88-0.95)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>≤65</td>
                <td colspan="2">0.96 (0.94-0.98)</td>
                <td colspan="2">0.93 (0.92-0.94)<sup>c</sup></td>
                <td>0.98 (0.96-0.99)</td>
              </tr>
              <tr valign="top">
                <td colspan="7">
                  <bold>Sex</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Female</td>
                <td colspan="2">0.95 (0.93-0.97)</td>
                <td colspan="2">0.92 (0.91-0.93)<sup>d</sup></td>
                <td>0.92 (0.90-0.94)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Male</td>
                <td colspan="2">0.95 (0.93-0.96)</td>
                <td colspan="2">0.89 (0.88-0.90)</td>
                <td>0.89 (0.87-0.91)</td>
              </tr>
              <tr valign="top">
                <td colspan="7">
                  <bold>Department</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Surgery</td>
                <td colspan="2">0.97 (0.95-1.00)</td>
                <td colspan="2">0.95 (0.94-0.96)<sup>e</sup></td>
                <td>0.95 (0.93-0.96)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Internal medicine</td>
                <td colspan="2">0.94 (0.92-0.96)</td>
                <td colspan="2">0.89 (0.88-0.90)</td>
                <td>0.89 (0.87-0.91)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Intensive care unit</td>
                <td colspan="2">0.95 (0.93-0.98)</td>
                <td colspan="2">0.92 (0.91-0.94)</td>
                <td>0.91 (0.90-0.93)</td>
              </tr>
              <tr valign="top">
                <td colspan="7">
                  <bold>Venous thromboembolism risk by department<sup>f</sup></bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>High</td>
                <td colspan="2">0.96 (0.94-0.97)</td>
                <td colspan="2">0.90 (0.89-0.91)</td>
                <td>0.90 (0.88-0.91)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Intermediate</td>
                <td colspan="2">0.94 (0.92-0.95)</td>
                <td colspan="2">0.90 (0.89-0.91)</td>
                <td>0.90 (0.88-0.91)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Low</td>
                <td colspan="2">1.00 (1.00-1.00)<sup>g</sup></td>
                <td colspan="2">0.97 (0.96-0.98)<sup>g</sup></td>
                <td>0.97 (0.96-0.98)</td>
              </tr>
              <tr valign="top">
                <td colspan="7">
                  <bold>Quarter of the study year</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>First quarter</td>
                <td colspan="2">0.94 (0.91-0.97)</td>
                <td colspan="2">0.91 (0.90-0.93)</td>
                <td>0.91 (0.89-0.93)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Second quarter</td>
                <td colspan="2">0.94 (0.92-0.97)</td>
                <td colspan="2">0.91 (0.90-0.93)</td>
                <td>0.91 (0.89-0.93)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Third quarter</td>
                <td colspan="2">0.95 (0.93-0.97)</td>
                <td colspan="2">0.92 (0.91-0.93)</td>
                <td>0.91 (0.90-0.93)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Fourth quarter</td>
                <td colspan="2">0.95 (0.93-0.97)</td>
                <td colspan="2">0.89 (0.88-0.90)<sup>h</sup></td>
                <td>0.89 (0.87-0.91)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table6fn1">
              <p><sup>a</sup>DeLong test was used for comparing areas under the curve.</p>
            </fn>
            <fn id="table6fn2">
              <p><sup>b</sup><italic>Z</italic> test was used for comparing F1-scores.</p>
            </fn>
            <fn id="table6fn3">
              <p><sup>c</sup>≤65 years versus &#62;65 years; <italic>P</italic>&#60;.001.</p>
            </fn>
            <fn id="table6fn4">
              <p><sup>d</sup>Female versus male; <italic>P</italic>&#60;.001.</p>
            </fn>
            <fn id="table6fn5">
              <p><sup>e</sup>Surgery versus internal medicine or intensive care unit; <italic>P</italic>&#60;.001; Bonferroni adjusted <italic>P</italic>=.003.</p>
            </fn>
            <fn id="table6fn6">
              <p><sup>f</sup>The low, intermediate, and high risks of venous thromboembolism were defined by departments having &#60;1, 1-5, and &#62;5 venous thromboembolism–related deaths per year, respectively.</p>
            </fn>
            <fn id="table6fn7">
              <p><sup>g</sup>Low versus high or intermediate; <italic>P</italic>&#60;.001; Bonferroni adjusted <italic>P</italic>=.003.</p>
            </fn>
            <fn id="table6fn8">
              <p><sup>h</sup>Fourth quarter versus third or second or first quarter; <italic>P</italic>&#60;.001; Bonferroni adjusted <italic>P</italic>=.002.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Diagnostic statistics of the clinical decision support system for venous thromboembolism risk assessment and integrated care for identifying any venous thromboembolism according to different settings. (A) Sensitivity and specificity. (B) Positive and negative predictive values. FN: false negative; FP: false positive; NPV: negative predictive value; PPV: positive predictive value; TN: true negative; TP: true positive; VTE: venous thromboembolism.</p>
          </caption>
          <graphic xlink:href="jmir_v25i1e43153_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table7">
          <label>Table 7</label>
          <caption>
            <p>Error analysis of the clinical decision support system for venous thromboembolism risk assessment and integrated care for detecting venous thromboembolism.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="810"/>
            <col width="160"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Type of error, reasons for discrepancy</td>
                <td>Values, n (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="3">
                  <bold>False positive (n=55)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Initially suspected to be venous thromboembolism but subsequently disproved</td>
                <td>29 (53)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Prior venous thromboembolism in the medical history but caught as on-admission venous thromboembolism</td>
                <td>23 (42)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>The admission diagnosis was modified but did not get caught by the system</td>
                <td>3 (5)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>False negative (n=63)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Asymptomatic isolated calf muscle vein thrombosis occurred but not in the discharge diagnosis</td>
                <td>44 (70)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>The admission diagnosis was modified but did not get caught by the system</td>
                <td>12 (19)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Unrecognized iliac vein thrombosis</td>
                <td>7 (11)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Subgroup Analysis</title>
        <p>Subgroup analysis by age, sex, and quarter of the study year demonstrated consistently good performance of the NLP tool in VTE detection, with sensitivity, specificity, PPV, and NPV all &#62;87% and AUC and F1-score both &#62;89%. The NLP tool detected VTE much better in patients aged ≤65 years than in patients aged &#62;65 years (specificity 99.9% vs 99.5%; NPV 99.9% vs 99.5%; LR+ 1494 vs 178; F1-score 0.93 vs 0.89; all <italic>P</italic>&#60;.001) (<xref ref-type="table" rid="table5">Table 5</xref>, <xref ref-type="table" rid="table6">Table 6</xref>, and <xref rid="figure4" ref-type="fig">Figure 4</xref>).</p>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>We developed an NLP algorithm with multisource EHR data and validated VTE detection extensively, in relation to different clinical settings with different VTE risks. The main findings of our study were as follows: (1) the NLP algorithm of DeVTEcare facilitated VTE detection with good diagnostic ability; (2) the NLP algorithm consistently detected the on-admission and in-hospital VTE well; however, the NLP algorithm showed higher sensitivity in detecting PE than DVT on admission; (3) among departments of surgery, internal medicine, and intensive care units, the highest specificity and NPV were shown in the surgery department; and (4) the NLP algorithm performed better among departments with low-risk VTE and among patients aged ≤65 years.</p>
      </sec>
      <sec>
        <title>Comparison With Prior Work</title>
        <p>NLP can identify unstructured language that documents the diagnosis or findings of interest. Previous studies [<xref ref-type="bibr" rid="ref10">10</xref>-<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref16">16</xref>-<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref32">32</xref>] on NLP embedded into EHRs to identify VTE were mainly based on imaging reports. Those studies reported about 94% sensitivity and 89% PPV for patients without surgery but only 81% sensitivity and 54% PPV for patients who had undergone surgery (<xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>) [<xref ref-type="bibr" rid="ref10">10</xref>-<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref16">16</xref>-<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref32">32</xref>]. The NLP algorithm in our DeVTEcare confirmed good sensitivity, specificity, PPV, and NPV for VTE detection not only for patients admitted to internal medicine units but also for patients in the surgery department, with higher specificity, NPV, and F1-scores in the surgery department than in the internal medicine and intensive care units.</p>
        <p>Surgical procedures are associated with increased VTE risk, and certain surgeries, for example, orthopedic surgery, major general surgery, gynecological surgery, urological surgery, and neurosurgery are considered to pose a higher risk for VTE. Our algorithm for VTE detection was extensively validated in these clinical settings and was found to have good diagnostic ability. Our algorithm could help clinicians increase the awareness and prevention of VTE. The good performance of our NLP algorithm may be associated with the use of multisource data from EHRs besides imaging reports and the application of a set of highly optimized and configurable NLP components that enable rapid and straightforward clinical information processing. Moreover, the NLP algorithm of DeVTEcare demonstrated a better identification of on-admission PE than DVT, which was rarely reported by previous studies [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref20">20</xref>]. PE is a more severe clinical issue than DVT; nonetheless, it can be a preventable cause of hospital death. Thus, early identification of patients with PE on admission is critical. The adoption of adequate treatments in such patients during hospitalization would help to reduce adverse outcomes. Since the prevalence of VTE could vary across age, gender, season, and VTE risk, the performance of the NLP algorithm may be affected. However, our study showed that our NLP algorithm performed favorably in VTE identification across all subgroups. In addition, we found that the NLP algorithm detected VTE events even better for patients from departments at low VTE risk and those aged ≤65 years. This could be because VTE occurred less often in these patients, but the NLP system still recognized VTE well and thus showed better specificity while maintaining relatively high sensitivity. The NLP algorithm of DeVTEcare simplified and streamlined the screening of VTE for inpatients in different departments with different risks of VTE, and thus, it can be a user-friendly tool to facilitate the prevention of hospital-associated VTE and related morbidity.</p>
        <p>Finally, the error analysis of our NLP tool for detecting VTE demonstrated that 81% of the false negative events were asymptomatic isolated calf muscle vein thrombosis and iliac vein thrombosis. This could partly explain the higher sensitivity of our NLP tool in PE detection than DVT detection on admission. In addition, 95% of the false positives were from patients with prior VTE or those with suspected VTE on admission but without confirmation of a diagnosis. The results from error analysis suggested that the text mining of key phrases needs to be further enhanced.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>There are several limitations in our study. First, although we tested the NLP algorithm extensively in different clinical settings, we cannot confirm if the findings of our study can be generalized to other hospitals, given the possible differences in the EHR structure, document formatting, and local terminologies. However, the rule-based NLP tool that employs a set of highly optimized and configurable NLP components can be easily tuned with a modest quantity of training data. Second, the VTE risk in the hospital departments was classified by the hospital quality control administration and we did not calculate the incidence rate of VTE, which is the standard procedure in epidemiological studies. Third, some physician-related factors such as the physician’s medical record writing style, awareness of VTE prevention and treatment, and imaging report quality have the potential to influence the NLP algorithm’s ability to identify VTE. Nonetheless, the hospital in our study is an academic teaching hospital in Beijing, which provides the highest quality of medical care in China. Fourth, given the retrospective design of this study, selection bias is possible, and further external validation is needed.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>The NLP algorithm of DeVTEcare identified VTE with good diagnostic ability across different clinical settings, especially for the surgery units, departments with low-risk VTE, and patients aged ≤65 years. This algorithm allows us to report accurate in-hospital VTE rates and to enhance risk-classified VTE integrated care in future research.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Checklist of the Standards for Reporting Diagnostic accuracy studies (STARD) 2015 guidelines.</p>
        <media xlink:href="jmir_v25i1e43153_app1.docx" xlink:title="DOCX File , 31 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Keywords for the natural language processing algorithm in the clinical decision support system for venous thromboembolism risk assessment and integrated care.</p>
        <media xlink:href="jmir_v25i1e43153_app2.docx" xlink:title="DOCX File , 12 KB"/>
      </supplementary-material>
      <supplementary-material id="app3">
        <label>Multimedia Appendix 3</label>
        <p>Incidence of venous thromboembolism confirmed by clinical experts according to hospital inpatient department.</p>
        <media xlink:href="jmir_v25i1e43153_app3.docx" xlink:title="DOCX File , 17 KB"/>
      </supplementary-material>
      <supplementary-material id="app4">
        <label>Multimedia Appendix 4</label>
        <p>Summary of studies that identify venous thromboembolism using the natural language processing tool.</p>
        <media xlink:href="jmir_v25i1e43153_app4.docx" xlink:title="DOCX File , 29 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AUC</term>
          <def>
            <p>area under the receiver operating characteristic curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">DeVTEcare</term>
          <def>
            <p>clinical decision support system for venous thromboembolism risk assessment and integrated care</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">DVT</term>
          <def>
            <p>deep vein thrombosis</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">EHR</term>
          <def>
            <p>electronic health record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">LR–</term>
          <def>
            <p>negative likelihood ratio</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">LR+</term>
          <def>
            <p>positive likelihood ratio</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">NPV</term>
          <def>
            <p>negative predictive value</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">PE</term>
          <def>
            <p>pulmonary embolism</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">PPV</term>
          <def>
            <p>positive predictive value</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">STARD</term>
          <def>
            <p>Standards for Reporting Diagnostic accuracy studies</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">VTE</term>
          <def>
            <p>venous thromboembolism</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <notes>
      <sec>
        <title>Data Availability</title>
        <p>The data that support the findings of this study are available from the corresponding author upon reasonable request.</p>
      </sec>
    </notes>
    <ack>
      <p>This research project was funded by the National Natural Science Foundation of China (82170309). We thank Professor Yang Wang (Medical Research and Biometrics Center, National Center for Cardiovascular Disease, Beijing, China) for his guidance on the statistical analysis for this study. We appreciate the technical assistance of the DrBreath Company and computer expert Chang-Zheng Li with the clinical decision support system for venous thromboembolism risk assessment and integrated care (DeVTEcare, DrBreath Co, Ltd, Beijing, China).</p>
    </ack>
    <fn-group>
      <fn fn-type="con">
        <p>YG and Y Yao had full access to all of the data in this study and take responsibility for the integrity of the data and the accuracy of the data analysis. YG, Y Yao, ZJ, and HZ contributed to study concept and design. ZJ, YG, MT, HZ, Y Yang, and Y Yao contributed to acquisition, analysis, and interpretation of data. ZJ drafted the manuscript. ZJ, YG, HZ, MT, Y Yang, and Y Yao critically revised the manuscript for important intellectual content. ZJ conducted the statistical analysis. YG obtained funding.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Heit</surname>
              <given-names>JA</given-names>
            </name>
          </person-group>
          <article-title>Epidemiology of venous thromboembolism</article-title>
          <source>Nat Rev Cardiol</source>
          <year>2015</year>
          <month>08</month>
          <volume>12</volume>
          <issue>8</issue>
          <fpage>464</fpage>
          <lpage>74</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/26076949"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/nrcardio.2015.83</pub-id>
          <pub-id pub-id-type="medline">26076949</pub-id>
          <pub-id pub-id-type="pii">nrcardio.2015.83</pub-id>
          <pub-id pub-id-type="pmcid">PMC4624298</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nicholson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chan</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Bhagirath</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Ginsberg</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Prevention of Venous Thromboembolism in 2020 and Beyond</article-title>
          <source>J Clin Med</source>
          <year>2020</year>
          <month>08</month>
          <day>01</day>
          <volume>9</volume>
          <issue>8</issue>
          <fpage>2467</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=jcm9082467"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/jcm9082467</pub-id>
          <pub-id pub-id-type="medline">32752154</pub-id>
          <pub-id pub-id-type="pii">jcm9082467</pub-id>
          <pub-id pub-id-type="pmcid">PMC7465935</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Weller</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Porterfield</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Davis</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wilkinson</surname>
              <given-names>GS</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Baillargeon</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Incidence of venous thrombotic events and events of special interest in a retrospective cohort of commercially insured US patients</article-title>
          <source>BMJ Open</source>
          <year>2022</year>
          <month>02</month>
          <day>09</day>
          <volume>12</volume>
          <issue>2</issue>
          <fpage>e054669</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmjopen.bmj.com/lookup/pmidlookup?view=long&#38;pmid=35140157"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmjopen-2021-054669</pub-id>
          <pub-id pub-id-type="medline">35140157</pub-id>
          <pub-id pub-id-type="pii">bmjopen-2021-054669</pub-id>
          <pub-id pub-id-type="pmcid">PMC8829845</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wendelboe</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Campbell</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ding</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Bratzler</surname>
              <given-names>DW</given-names>
            </name>
            <name name-style="western">
              <surname>Beckman</surname>
              <given-names>MG</given-names>
            </name>
            <name name-style="western">
              <surname>Reyes</surname>
              <given-names>NL</given-names>
            </name>
            <name name-style="western">
              <surname>Raskob</surname>
              <given-names>GE</given-names>
            </name>
          </person-group>
          <article-title>Incidence of Venous Thromboembolism in a Racially Diverse Population of Oklahoma County, Oklahoma</article-title>
          <source>Thromb Haemost</source>
          <year>2021</year>
          <month>06</month>
          <volume>121</volume>
          <issue>6</issue>
          <fpage>816</fpage>
          <lpage>825</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.thieme-connect.com/DOI/DOI?10.1055/s-0040-1722189"/>
          </comment>
          <pub-id pub-id-type="doi">10.1055/s-0040-1722189</pub-id>
          <pub-id pub-id-type="medline">33423245</pub-id>
          <pub-id pub-id-type="pmcid">PMC8180377</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Agnelli</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Anderson</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Arcelus</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bergqvist</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Brecht</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Greer</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Heit</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hutchinson</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kakkar</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mottier</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Oger</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Samama</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Spannagl</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Venous thromboembolism (VTE) in Europe</article-title>
          <source>Thromb Haemost</source>
          <year>2017</year>
          <month>12</month>
          <day>01</day>
          <volume>98</volume>
          <issue>10</issue>
          <fpage>756</fpage>
          <lpage>764</lpage>
          <pub-id pub-id-type="doi">10.1160/th07-03-0212</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yan</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Hang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Qin</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Qian</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Jia</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Shi</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Nurses' knowledge, attitudes, and behaviors toward venous thromboembolism prophylaxis: How to do better</article-title>
          <source>Vascular</source>
          <year>2021</year>
          <month>02</month>
          <volume>29</volume>
          <issue>1</issue>
          <fpage>78</fpage>
          <lpage>84</lpage>
          <pub-id pub-id-type="doi">10.1177/1708538120933782</pub-id>
          <pub-id pub-id-type="medline">32576119</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rognoni</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lugli</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Maleti</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Tarricone</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Clinical guidelines versus current clinical practice for the management of deep vein thrombosis</article-title>
          <source>J Vasc Surg Venous Lymphat Disord</source>
          <year>2021</year>
          <month>09</month>
          <volume>9</volume>
          <issue>5</issue>
          <fpage>1334</fpage>
          <lpage>1344.e1</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jvsv.2021.01.020</pub-id>
          <pub-id pub-id-type="medline">33744498</pub-id>
          <pub-id pub-id-type="pii">S2213-333X(21)00104-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Henke</surname>
              <given-names>PK</given-names>
            </name>
            <name name-style="western">
              <surname>Kahn</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Pannucci</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Secemsky</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Evans</surname>
              <given-names>NS</given-names>
            </name>
            <name name-style="western">
              <surname>Khorana</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Creager</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Pradhan</surname>
              <given-names>AD</given-names>
            </name>
          </person-group>
          <article-title>Call to Action to Prevent Venous Thromboembolism in Hospitalized Patients: A Policy Statement From the American Heart Association</article-title>
          <source>Circulation</source>
          <year>2020</year>
          <month>06</month>
          <day>16</day>
          <volume>141</volume>
          <issue>24</issue>
          <fpage>e914</fpage>
          <lpage>e931</lpage>
          <pub-id pub-id-type="doi">10.1161/cir.0000000000000769</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Held</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Jung</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Sommervold</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kreuziger</surname>
              <given-names>LB</given-names>
            </name>
          </person-group>
          <article-title>Patient Safety Indicator-12 Rarely Identifies Problems with Quality of Care in Perioperative Venous Thromboembolism</article-title>
          <source>J Hosp Med</source>
          <year>2020</year>
          <month>02</month>
          <volume>15</volume>
          <issue>2</issue>
          <fpage>75</fpage>
          <lpage>80</lpage>
          <pub-id pub-id-type="doi">10.12788/jhm.3298</pub-id>
          <pub-id pub-id-type="medline">31995470</pub-id>
          <pub-id pub-id-type="pii">jhm.3298</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Verma</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Masoom</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Pou-Prom</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Shin</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Guerzhoy</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Fralick</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Mamdani</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Razak</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Developing and validating natural language processing algorithms for radiology reports compared to ICD-10 codes for identifying venous thromboembolism in hospitalized medical patients</article-title>
          <source>Thromb Res</source>
          <year>2022</year>
          <month>01</month>
          <volume>209</volume>
          <fpage>51</fpage>
          <lpage>58</lpage>
          <pub-id pub-id-type="doi">10.1016/j.thromres.2021.11.020</pub-id>
          <pub-id pub-id-type="medline">34871982</pub-id>
          <pub-id pub-id-type="pii">S0049-3848(21)00529-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Signor</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Lappe</surname>
              <given-names>KL</given-names>
            </name>
            <name name-style="western">
              <surname>Shi</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jenkins</surname>
              <given-names>SL</given-names>
            </name>
            <name name-style="western">
              <surname>Wikstrom</surname>
              <given-names>SW</given-names>
            </name>
            <name name-style="western">
              <surname>Kroencke</surname>
              <given-names>RD</given-names>
            </name>
            <name name-style="western">
              <surname>Hallowell</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Witt</surname>
              <given-names>DM</given-names>
            </name>
          </person-group>
          <article-title>A comparison of natural language processing to ICD-10 codes for identification and characterization of pulmonary embolism</article-title>
          <source>Thromb Res</source>
          <year>2021</year>
          <month>07</month>
          <volume>203</volume>
          <fpage>190</fpage>
          <lpage>195</lpage>
          <pub-id pub-id-type="doi">10.1016/j.thromres.2021.04.020</pub-id>
          <pub-id pub-id-type="medline">34044246</pub-id>
          <pub-id pub-id-type="pii">S0049-3848(21)00313-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shi</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hurdle</surname>
              <given-names>JF</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Ferraro</surname>
              <given-names>JP</given-names>
            </name>
            <name name-style="western">
              <surname>Skarda</surname>
              <given-names>DE</given-names>
            </name>
            <name name-style="western">
              <surname>Finlayson</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Samore</surname>
              <given-names>MH</given-names>
            </name>
            <name name-style="western">
              <surname>Bucher</surname>
              <given-names>BT</given-names>
            </name>
          </person-group>
          <article-title>Natural language processing for the surveillance of postoperative venous thromboembolism</article-title>
          <source>Surgery</source>
          <year>2021</year>
          <month>10</month>
          <volume>170</volume>
          <issue>4</issue>
          <fpage>1175</fpage>
          <lpage>1182</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34090671"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.surg.2021.04.027</pub-id>
          <pub-id pub-id-type="medline">34090671</pub-id>
          <pub-id pub-id-type="pii">S0039-6060(21)00399-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC8490271</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Fu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bielinski</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Decker</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Chamberlain</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Roger</surname>
              <given-names>VL</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Larson</surname>
              <given-names>NB</given-names>
            </name>
          </person-group>
          <article-title>Natural Language Processing and Machine Learning for Identifying Incident Stroke From Electronic Health Records: Algorithm Development and Validation</article-title>
          <source>J Med Internet Res</source>
          <year>2021</year>
          <month>03</month>
          <day>08</day>
          <volume>23</volume>
          <issue>3</issue>
          <fpage>e22951</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2021/3/e22951/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/22951</pub-id>
          <pub-id pub-id-type="medline">33683212</pub-id>
          <pub-id pub-id-type="pii">v23i3e22951</pub-id>
          <pub-id pub-id-type="pmcid">PMC7985804</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Moore</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Jain</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Haas</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Yadav</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Whitsel</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Rosamand</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Heiss</surname>
              <given-names>Gerardo</given-names>
            </name>
            <name name-style="western">
              <surname>Kucharska-Newton</surname>
              <given-names>Anna M</given-names>
            </name>
          </person-group>
          <article-title>Ascertaining Framingham heart failure phenotype from inpatient electronic health record data using natural language processing: a multicentre Atherosclerosis Risk in Communities (ARIC) validation study</article-title>
          <source>BMJ Open</source>
          <year>2021</year>
          <month>06</month>
          <day>14</day>
          <volume>11</volume>
          <issue>6</issue>
          <fpage>e047356</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmjopen.bmj.com/lookup/pmidlookup?view=long&#38;pmid=34127492"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmjopen-2020-047356</pub-id>
          <pub-id pub-id-type="medline">34127492</pub-id>
          <pub-id pub-id-type="pii">bmjopen-2020-047356</pub-id>
          <pub-id pub-id-type="pmcid">PMC8204176</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Le Glaz</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Haralambous</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Kim-Dufor</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Lenca</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Billot</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Ryan</surname>
              <given-names>TC</given-names>
            </name>
            <name name-style="western">
              <surname>Marsh</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>DeVylder</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Walter</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Berrouiguet</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lemey</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Machine Learning and Natural Language Processing in Mental Health: Systematic Review</article-title>
          <source>J Med Internet Res</source>
          <year>2021</year>
          <month>05</month>
          <day>04</day>
          <volume>23</volume>
          <issue>5</issue>
          <fpage>e15708</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2021/5/e15708/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/15708</pub-id>
          <pub-id pub-id-type="medline">33944788</pub-id>
          <pub-id pub-id-type="pii">v23i5e15708</pub-id>
          <pub-id pub-id-type="pmcid">PMC8132982</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rochefort</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Verma</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Eguale</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Buckeridge</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>A novel method of adverse event detection can accurately identify venous thromboembolisms (VTEs) from narrative electronic health record data</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2015</year>
          <month>01</month>
          <volume>22</volume>
          <issue>1</issue>
          <fpage>155</fpage>
          <lpage>165</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/25332356"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/amiajnl-2014-002768</pub-id>
          <pub-id pub-id-type="medline">25332356</pub-id>
          <pub-id pub-id-type="pii">amiajnl-2014-002768</pub-id>
          <pub-id pub-id-type="pmcid">PMC4433368</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wendelboe</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Saber</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Dvorak</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Adamski</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Feland</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Reyes</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Abe</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Ortel</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Raskob</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Exploring the Applicability of Using Natural Language Processing to Support Nationwide Venous Thromboembolism Surveillance: Model Evaluation Study</article-title>
          <source>JMIR Bioinform Biotech</source>
          <year>2022</year>
          <month>08</month>
          <day>05</day>
          <volume>3</volume>
          <issue>1</issue>
          <fpage>e36877</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bioinform.jmir.org/2022/1/e36877/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/36877</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Woller</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Daw</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Aston</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Lloyd</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Snow</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Stevens</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Woller</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Bledsoe</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Natural Language Processing Performance for the Identification of Venous Thromboembolism in an Integrated Healthcare System</article-title>
          <source>Clin Appl Thromb Hemost</source>
          <year>2021</year>
          <volume>27</volume>
          <fpage>10760296211013108</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://journals.sagepub.com/doi/abs/10.1177/10760296211013108?url_ver=Z39.88-2003&#38;rfr_id=ori:rid:crossref.org&#38;rfr_dat=cr_pub%20%200pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/10760296211013108</pub-id>
          <pub-id pub-id-type="medline">33906470</pub-id>
          <pub-id pub-id-type="pmcid">PMC8107936</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huesch</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Cherian</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Labib</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Mahraj</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Evaluating Report Text Variation and Informativeness: Natural Language Processing of CT Chest Imaging for Pulmonary Embolism</article-title>
          <source>J Am Coll Radiol</source>
          <year>2018</year>
          <month>03</month>
          <volume>15</volume>
          <issue>3 Pt B</issue>
          <fpage>554</fpage>
          <lpage>562</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jacr.2017.12.017</pub-id>
          <pub-id pub-id-type="medline">29396123</pub-id>
          <pub-id pub-id-type="pii">S1546-1440(17)31653-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dantes</surname>
              <given-names>RB</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Beckman</surname>
              <given-names>MG</given-names>
            </name>
            <name name-style="western">
              <surname>Krishnaswamy</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Richardson</surname>
              <given-names>LC</given-names>
            </name>
            <name name-style="western">
              <surname>Chernetsky-Tejedor</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Improved Identification of Venous Thromboembolism From Electronic Medical Records Using a Novel Information Extraction Software Platform</article-title>
          <source>Med Care</source>
          <year>2018</year>
          <month>09</month>
          <volume>56</volume>
          <issue>9</issue>
          <fpage>e54</fpage>
          <lpage>e60</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/29087984"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/MLR.0000000000000831</pub-id>
          <pub-id pub-id-type="medline">29087984</pub-id>
          <pub-id pub-id-type="pmcid">PMC5927846</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Swartz</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Koziatek</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Theobald</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Iturrate</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Creation of a simple natural language processing tool to support an imaging utilization quality dashboard</article-title>
          <source>Int J Med Inform</source>
          <year>2017</year>
          <month>05</month>
          <volume>101</volume>
          <fpage>93</fpage>
          <lpage>99</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2017.02.011</pub-id>
          <pub-id pub-id-type="medline">28347453</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(17)30050-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gálvez</surname>
              <given-names>Jorge A</given-names>
            </name>
            <name name-style="western">
              <surname>Pappas</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Ahumada</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Martin</surname>
              <given-names>JN</given-names>
            </name>
            <name name-style="western">
              <surname>Simpao</surname>
              <given-names>AF</given-names>
            </name>
            <name name-style="western">
              <surname>Rehman</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Witmer</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>The use of natural language processing on pediatric diagnostic radiology reports in the electronic health record to identify deep venous thrombosis in children</article-title>
          <source>J Thromb Thrombolysis</source>
          <year>2017</year>
          <month>10</month>
          <volume>44</volume>
          <issue>3</issue>
          <fpage>281</fpage>
          <lpage>290</lpage>
          <pub-id pub-id-type="doi">10.1007/s11239-017-1532-y</pub-id>
          <pub-id pub-id-type="medline">28815363</pub-id>
          <pub-id pub-id-type="pii">10.1007/s11239-017-1532-y</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tian</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Eguale</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Rochefort</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Automated Extraction of VTE Events From Narrative Radiology Reports in Electronic Health Records: A Validation Study</article-title>
          <source>Med Care</source>
          <year>2017</year>
          <month>10</month>
          <volume>55</volume>
          <issue>10</issue>
          <fpage>e73</fpage>
          <lpage>e80</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/25924079"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/MLR.0000000000000346</pub-id>
          <pub-id pub-id-type="medline">25924079</pub-id>
          <pub-id pub-id-type="pmcid">PMC5603980</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Selby</surname>
              <given-names>LV</given-names>
            </name>
            <name name-style="western">
              <surname>Narain</surname>
              <given-names>WR</given-names>
            </name>
            <name name-style="western">
              <surname>Russo</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Strong</surname>
              <given-names>VE</given-names>
            </name>
            <name name-style="western">
              <surname>Stetson</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Autonomous detection, grading, and reporting of postoperative complications using natural language processing</article-title>
          <source>Surgery</source>
          <year>2018</year>
          <month>12</month>
          <volume>164</volume>
          <issue>6</issue>
          <fpage>1300</fpage>
          <lpage>1305</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/30056994"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.surg.2018.05.008</pub-id>
          <pub-id pub-id-type="medline">30056994</pub-id>
          <pub-id pub-id-type="pii">S0039-6060(18)30219-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC6784320</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bossuyt</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Reitsma</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bruns</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Gatsonis</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Glasziou</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Irwig</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Lijmer</surname>
              <given-names>Jeroen G</given-names>
            </name>
            <name name-style="western">
              <surname>Moher</surname>
              <given-names>David</given-names>
            </name>
            <name name-style="western">
              <surname>Rennie</surname>
              <given-names>Drummond</given-names>
            </name>
            <name name-style="western">
              <surname>de Vet</surname>
              <given-names>Henrica C W</given-names>
            </name>
            <name name-style="western">
              <surname>Kressel</surname>
              <given-names>Herbert Y</given-names>
            </name>
            <name name-style="western">
              <surname>Rifai</surname>
              <given-names>Nader</given-names>
            </name>
            <name name-style="western">
              <surname>Golub</surname>
              <given-names>Robert M</given-names>
            </name>
            <name name-style="western">
              <surname>Altman</surname>
              <given-names>Douglas G</given-names>
            </name>
            <name name-style="western">
              <surname>Hooft</surname>
              <given-names>Lotty</given-names>
            </name>
            <name name-style="western">
              <surname>Korevaar</surname>
              <given-names>Daniël A</given-names>
            </name>
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>Jérémie F</given-names>
            </name>
            <collab>STARD Group</collab>
          </person-group>
          <article-title>STARD 2015: an updated list of essential items for reporting diagnostic accuracy studies</article-title>
          <source>BMJ</source>
          <year>2015</year>
          <month>10</month>
          <day>28</day>
          <volume>351</volume>
          <fpage>h5527</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.bmj.com/lookup/pmidlookup?view=long&#38;pmid=26511519"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmj.h5527</pub-id>
          <pub-id pub-id-type="medline">26511519</pub-id>
          <pub-id pub-id-type="pmcid">PMC4623764</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <collab>Expert Committee on Guidelines for the Prevention of Thrombotic Diseases in China</collab>
          </person-group>
          <article-title>Chinese Guidelines for the Prevention and Treatment of Thrombophilia</article-title>
          <source>National Medical Journal of China</source>
          <year>2018</year>
          <volume>98</volume>
          <issue>36</issue>
          <fpage>2861</fpage>
          <lpage>2888</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://rs.yiigle.com/CN112137201836/1066358.htm"/>
          </comment>
          <pub-id pub-id-type="doi">10.3760/cma.j.issn.0376-2491.2018.36.002</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="web">
          <source>Notice on launching the work related to the performance appraisal of national tertiary public hospitals in 2019</source>
          <access-date>2023-03-31</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.nhc.gov.cn/yzygj/s3593g/201904/b8323261bb8a4175a2046d2fffa93936.shtml">http://www.nhc.gov.cn/yzygj/s3593g/201904/b8323261bb8a4175a2046d2fffa93936.shtml</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="web">
          <source>Mayo Clinic</source>
          <access-date>2023-03-31</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mayoclinic.org/zh-hans/diseases-conditions">https://www.mayoclinic.org/zh-hans/diseases-conditions</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Marill</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>KF</given-names>
            </name>
            <name name-style="western">
              <surname>Friedman</surname>
              <given-names>AB</given-names>
            </name>
          </person-group>
          <article-title>Estimating negative likelihood ratio confidence when test sensitivity is 100%: A bootstrapping approach</article-title>
          <source>Stat Methods Med Res</source>
          <year>2017</year>
          <month>08</month>
          <volume>26</volume>
          <issue>4</issue>
          <fpage>1936</fpage>
          <lpage>1948</lpage>
          <pub-id pub-id-type="doi">10.1177/0962280215592907</pub-id>
          <pub-id pub-id-type="medline">26152746</pub-id>
          <pub-id pub-id-type="pii">0962280215592907</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gorfine</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>De-Picciotto</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Hsu</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Conditional and Marginal Estimates in Case-Control Family Data - Extensions and Sensitivity Analyses</article-title>
          <source>J Stat Comput Simul</source>
          <year>2012</year>
          <month>10</month>
          <day>01</day>
          <volume>82</volume>
          <issue>10</issue>
          <fpage>1449</fpage>
          <lpage>1470</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/23002315"/>
          </comment>
          <pub-id pub-id-type="doi">10.1080/00949655.2011.581669</pub-id>
          <pub-id pub-id-type="medline">23002315</pub-id>
          <pub-id pub-id-type="pmcid">PMC3446754</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>FitzHenry</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Murff</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Matheny</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gentry</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Fielstein</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Brown</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Reeves</surname>
              <given-names>Ruth M</given-names>
            </name>
            <name name-style="western">
              <surname>Aronsky</surname>
              <given-names>Dominik</given-names>
            </name>
            <name name-style="western">
              <surname>Elkin</surname>
              <given-names>Peter L</given-names>
            </name>
            <name name-style="western">
              <surname>Messina</surname>
              <given-names>Vincent P</given-names>
            </name>
            <name name-style="western">
              <surname>Speroff</surname>
              <given-names>Theodore</given-names>
            </name>
          </person-group>
          <article-title>Exploring the frontier of electronic health record surveillance: the case of postoperative complications</article-title>
          <source>Med Care</source>
          <year>2013</year>
          <month>06</month>
          <volume>51</volume>
          <issue>6</issue>
          <fpage>509</fpage>
          <lpage>516</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/23673394"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/MLR.0b013e31828d1210</pub-id>
          <pub-id pub-id-type="medline">23673394</pub-id>
          <pub-id pub-id-type="pii">00005650-201306000-00006</pub-id>
          <pub-id pub-id-type="pmcid">PMC3658153</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Murff</surname>
              <given-names>HJ</given-names>
            </name>
            <name name-style="western">
              <surname>FitzHenry</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Matheny</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Gentry</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Kotter</surname>
              <given-names>KL</given-names>
            </name>
            <name name-style="western">
              <surname>Crimin</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Dittus</surname>
              <given-names>RS</given-names>
            </name>
            <name name-style="western">
              <surname>Rosen</surname>
              <given-names>AK</given-names>
            </name>
            <name name-style="western">
              <surname>Elkin</surname>
              <given-names>PL</given-names>
            </name>
            <name name-style="western">
              <surname>Brown</surname>
              <given-names>SH</given-names>
            </name>
            <name name-style="western">
              <surname>Speroff</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Automated identification of postoperative complications within an electronic medical record using natural language processing</article-title>
          <source>JAMA</source>
          <year>2011</year>
          <month>08</month>
          <day>24</day>
          <volume>306</volume>
          <issue>8</issue>
          <fpage>848</fpage>
          <lpage>855</lpage>
          <pub-id pub-id-type="doi">10.1001/jama.2011.1204</pub-id>
          <pub-id pub-id-type="medline">21862746</pub-id>
          <pub-id pub-id-type="pii">306/8/848</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
