<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v24i8e37486</article-id>
      <article-id pub-id-type="pmid">35921141</article-id>
      <article-id pub-id-type="doi">10.2196/37486</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Improving the Performance of Outcome Prediction for Inpatients With Acute Myocardial Infarction Based on Embedding Representation Learned From Electronic Medical Records: Development and Validation Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Nuutinen</surname>
            <given-names>Mikko</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Jorm</surname>
            <given-names>Louisa</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Qian</surname>
            <given-names>Buyue</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Huang</surname>
            <given-names>Yanqun</given-names>
          </name>
          <degrees>BS</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8111-6352</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Zheng</surname>
            <given-names>Zhimin</given-names>
          </name>
          <degrees>BS</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6656-7195</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Ma</surname>
            <given-names>Moxuan</given-names>
          </name>
          <degrees>MS</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9941-5569</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Xin</surname>
            <given-names>Xin</given-names>
          </name>
          <degrees>MS</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0315-3518</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>Honglei</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5518-4749</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Fei</surname>
            <given-names>Xiaolu</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7498-0249</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Wei</surname>
            <given-names>Lan</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1128-1314</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>Hui</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>School of Biomedical Engineering</institution>
            <institution>Capital Medical University</institution>
            <addr-line>No. 10, Xitoutiao, You An Men, Fengtai District</addr-line>
            <addr-line>Beijing, 100069</addr-line>
            <country>China</country>
            <phone>86 01083911545</phone>
            <email>chenhui@ccmu.edu.cn</email>
          </address>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0048-0193</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>School of Biomedical Engineering</institution>
        <institution>Capital Medical University</institution>
        <addr-line>Beijing</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Beijing Key Laboratory of Fundamental Research on Biomechanics in Clinical Application</institution>
        <institution>Capital Medical University</institution>
        <addr-line>Beijing</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Information Center</institution>
        <institution>Xuanwu Hospital</institution>
        <institution>Capital Medical University</institution>
        <addr-line>Beijing</addr-line>
        <country>China</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Hui Chen <email>chenhui@ccmu.edu.cn</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>8</month>
        <year>2022</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>3</day>
        <month>8</month>
        <year>2022</year>
      </pub-date>
      <volume>24</volume>
      <issue>8</issue>
      <elocation-id>e37486</elocation-id>
      <history>
        <date date-type="received">
          <day>22</day>
          <month>2</month>
          <year>2022</year>
        </date>
        <date date-type="rev-request">
          <day>20</day>
          <month>4</month>
          <year>2022</year>
        </date>
        <date date-type="rev-recd">
          <day>2</day>
          <month>6</month>
          <year>2022</year>
        </date>
        <date date-type="accepted">
          <day>18</day>
          <month>7</month>
          <year>2022</year>
        </date>
      </history>
      <copyright-statement>©Yanqun Huang, Zhimin Zheng, Moxuan Ma, Xin Xin, Honglei Liu, Xiaolu Fei, Lan Wei, Hui Chen. Originally published in the Journal of Medical Internet Research (https://www.jmir.org), 03.08.2022.</copyright-statement>
      <copyright-year>2022</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on https://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2022/8/e37486" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>The widespread secondary use of electronic medical records (EMRs) promotes health care quality improvement. Representation learning that can automatically extract hidden information from EMR data has gained increasing attention.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>We aimed to propose a patient representation with more feature associations and task-specific feature importance to improve the outcome prediction performance for inpatients with acute myocardial infarction (AMI).</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>Medical concepts, including patients’ age, gender, disease diagnoses, laboratory tests, structured radiological features, procedures, and medications, were first embedded into real-value vectors using the improved skip-gram algorithm, where concepts in the context windows were selected by feature association strengths measured by association rule confidence. Then, each patient was represented as the sum of the feature embeddings weighted by the task-specific feature importance, which was applied to facilitate predictive model prediction from global and local perspectives. We finally applied the proposed patient representation into mortality risk prediction for 3010 and 1671 AMI inpatients from a public data set and a private data set, respectively, and compared it with several reference representation methods in terms of the area under the receiver operating characteristic curve (AUROC), area under the precision-recall curve (AUPRC), and F1-score.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Compared with the reference methods, the proposed embedding-based representation showed consistently superior predictive performance on the 2 data sets, achieving mean AUROCs of 0.878 and 0.973, AUPRCs of 0.220 and 0.505, and F1-scores of 0.376 and 0.674 for the public and private data sets, respectively, while the greatest AUROCs, AUPRCs, and F1-scores among the reference methods were 0.847 and 0.939, 0.196 and 0.283, and 0.344 and 0.361 for the public and private data sets, respectively. Feature importance integrated in patient representation reflected features that were also critical in prediction tasks and clinical practice.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>The introduction of feature associations and feature importance facilitated an effective patient representation and contributed to prediction performance improvement and model interpretation.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>representation learning</kwd>
        <kwd>skip-gram</kwd>
        <kwd>feature association strengths</kwd>
        <kwd>feature importance</kwd>
        <kwd>mortality risk prediction</kwd>
        <kwd>acute myocardial infarction</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Electronic medical records (EMRs) contain diverse and heterogeneous information, such as demographic data, disease diagnoses, laboratory tests, radiological findings, examinations and procedures, and medications. EMR data can be used to not only reflect the health status of patients and record the treatment trajectory, but also help doctors in making clinical decisions [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref6">6</xref>] and improving the efficiency of diagnosis and treatment [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref8">8</xref>]. One of the most prevalent and practical tasks of the secondary use of EMR data is building models to predict the disease status [<xref ref-type="bibr" rid="ref8">8</xref>-<xref ref-type="bibr" rid="ref10">10</xref>] and treatment outcomes [<xref ref-type="bibr" rid="ref11">11</xref>-<xref ref-type="bibr" rid="ref17">17</xref>] for a patient, using machine learning algorithms.</p>
      <p>However, the high dimensionality, sparsity, and heterogeneity of EMR data [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref18">18</xref>] pose many obstacles for directly inputting the raw data into machine learning–based predictive models. Some manual and data-driven feature engineering methods [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref19">19</xref>], though time-consuming and laborious, were used to select important features or extract useful information for predictive tasks. Moreover, the performance of predictive models relies heavily on the representation of data. It was reported that effective representation methods could make the downstream modeling simpler and more flexible, and greatly improve the predictive performance [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref20">20</xref>]. By transforming raw features into compact vectors, representation learning can make it easier to automatically extract useful information when building predictive models [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref22">22</xref>]. One widely used representation method for EMR data is the skip-gram algorithm [<xref ref-type="bibr" rid="ref23">23</xref>], a distributed embedding method that treats patient records as sentences and medical concepts as words. An inevitable problem in the skip-gram algorithm is that contrary to words within a sentence, medical concepts in a patient’s record do not have a natural order, making it difficult to learn meaningful representations of concepts that have potential associations. One solution for this problem was randomly shuffling the concepts within a record to learn concept embeddings [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref24">24</xref>-<xref ref-type="bibr" rid="ref26">26</xref>]. It could reduce the impact of the disorder attribute of medical concepts on the algorithm to some degree, while associations among these concepts were still not taken into consideration.</p>
      <p>Acute myocardial infarction (AMI) is an acute ischemic heart disease and is the second leading cause of death. One in every 6 deaths is caused by ischemic heart disease, where AMI accounts for the majority of deaths [<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>]. Mortality risk prediction for AMI patients plays a crucial role in clinical work, helping doctors identify potential clinical factors, take early intervention measures based on timely alerts of patients’ adverse health statuses, and reduce the burdensome expenditure of related health care expenses. Therefore, researchers [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref29">29</xref>-<xref ref-type="bibr" rid="ref31">31</xref>] have focused on building machine learning models for the outcome prediction of AMI patients, and most of them used specific clinical features, such as laboratory test results (eg, albumin), comorbidities (eg, diabetes), and demographic data (eg, gender).</p>
      <p>In this study, we aimed to represent various structured features extracted from EMR data as fixed-length embedding vectors, which were then used to improve the performance of predictive models for the death risk of AMI patients. Specifically, we introduced the association strengths into the skip-gram algorithm to learn more informative representations of features. We also introduced the Shapley additive explanations (SHAP) [<xref ref-type="bibr" rid="ref32">32</xref>] technique to facilitate representation at the patient level and enhance the interpretability of the predictive model. An overview of our proposed representation learning framework and its application is shown in <xref rid="figure1" ref-type="fig">Figure 1</xref>.</p>
      <fig id="figure1" position="float">
        <label>Figure 1</label>
        <caption>
          <p>Overview of the proposed representation learning method for patients’ mortality risk prediction. First, feature representations were learned by the skip-gram algorithm using an adaptive context window. Then, patient representations were constructed based on feature representations weighted by the feature importance. Finally, the proposed patient representation was applied in the mortality risk prediction for acute myocardial infarction in-patients from a public data set and a private data set, and compared with reference methods.</p>
        </caption>
        <graphic xlink:href="jmir_v24i8e37486_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Skip-Gram–Based Patient Representation</title>
        <p>The representation was learned hierarchically at the following 3 levels: the concept, feature, and patient levels. At the concept level, we employed the improved skip-gram algorithm [<xref ref-type="bibr" rid="ref23">23</xref>] to represent a concept as an embedding vector. In the natural language processing domain, the basic idea of skip-gram was to maximize the occurrence probabilities of the target words and the context words in the predefined context window, making the words that appear in the same context window closer in the embedding space. Unlike words with natural orders in a sentence, medical concepts appeared out of order in a patient record for a certain hospital stay. This made it difficult to determine the context window that contained relevant concepts for the target concept, especially when the number of concepts in a record was far larger than the size of the context window. Thus, for a concept within a record, we identified relevant concepts using its association strength with a candidate concept in the same record. The association strength was defined as the confidence (equation 1) of an association rule with one candidate concept as the unique antecedent (or consequent).</p>
        <disp-formula>Confidence (C1, C2) = &#124;C1∩C2&#124; / &#124;C1&#124; <bold>(1)</bold></disp-formula>
        <p>where C1 and C2 are the antecedent and consequent concepts, respectively, of an association rule C1→C2, and &#124;C1&#124; and &#124;C1∩C2&#124; are the numbers of patient records containing C1 and both C1 and C2, respectively. The greater the confidence, the stronger the association between the 2 concepts. Antecedent (or consequent) concepts in association rules with the top N highest confidences were included in the context window of the target concept. We called these selection schemes of context concepts <italic>antecedent-based</italic> (or <italic>consequent-based</italic>) embeddings. <xref rid="figure2" ref-type="fig">Figure 2</xref> provides an example of the consequent-based selection scheme of context concepts.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>An illustration of context concept selection for the skip-gram algorithm using association strengths. All records are composed of 10 concepts (C1, C2, ……, and C10). In the confidence matrix, element Cij was the confidence of the association rule with Cj as antecedent and Ci as consequent. For patient 1 with 6 concepts (C1, C3, C6, C7, C8, and C10), the included concepts in C1’s 4-concept context window were selected from the remining 5 candidate concepts, whose confidences were 0.66 (antecedent, C10), 0.62 (C3), 0.55 (C6), 0.53 (C8), and 0.46 (C7). Therefore, C10, C3, C6, and C8 were selected to construct the context window for C1.</p>
          </caption>
          <graphic xlink:href="jmir_v24i8e37486_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>Moreover, to reduce the high dimensionality and sparsity of a large number of concepts, while preserving the clinical information as much as possible, we aggregated the concepts of disease diagnoses and procedures into several clinically meaningful feature groups according to International Classification of Diseases, 10th revision (ICD-10) codes and International Classification of Diseases, 9th revision (ICD-9) codes, and with the help of clinical experts. For example, disease diagnoses of type 1 diabetes mellitus and type 2 diabetes mellitus were grouped into the feature group of diabetes mellitus. The average of all embedding vectors of concepts from the same feature group in a patient record was treated as the representation at the feature level for the patient.</p>
        <p>The representation at the patient level was the weighted sum of feature-level representations. The feature weights were obtained under the guidance of the predictive task, indicating the importance of each feature involved in the patient representation. In this study, we used SHAP values as the feature weights. The SHAP framework is a machine learning interpretation technique based on the idea of game theory. It approximated a trained prediction model with a different but simple model that could easily calculate the contribution in the form of a SHAP value for each feature in the prediction model and performed additive feature attribution to explain the combination of features [<xref ref-type="bibr" rid="ref32">32</xref>]. A positive or negative SHAP value reflected a positive or negative influence on the prediction. A feature’s importance was then computed as the average of its absolute SHAP values from all samples.</p>
      </sec>
      <sec>
        <title>Experiments and Evaluations</title>
        <sec>
          <title>Data Sets and Data Preprocessing</title>
          <p>In this study, we used a public data set, the freely accessible critical care database Medical Information Mart for Intensive Care III (MIMIC-III data set [<xref ref-type="bibr" rid="ref33">33</xref>]), and a private data set for the experiments.</p>
          <p>The MIMIC-III data set was collected between June 2001 and October 2012, and involved 46,520 patients admitted to intensive care units at the Beth Israel Deaconess Medical Center in Boston, Massachusetts. It includes patient health information, such as demographics, vital signs, laboratory test results, medications, procedures, diagnosis codes, and clinical notes. The informative MIMIC-III data set was widely used in some medical machine learning modeling and algorithm evaluations, providing strong data support for researchers to establish models and evaluate algorithms [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref18">18</xref>].</p>
          <p>The private data set was derived from the EMR system of a tertiary hospital, Xuanwu Hospital, Capital Medical University, Beijing, China, between January 2014 and December 2016. Patient features included hospital admission and discharge information, demographic data, disease diagnoses, laboratory tests, examinations and procedures, medications, and radiology reports of chest X-ray or color sonography examination.</p>
          <p>We extracted the records of all 3010 and 1671 AMI patients from the public and private data sets, respectively. The diagnosis of AMI was confirmed with the ICD-9 codes 410.01 to 410.91 or ICD-10 codes I21 and I22. There were 254 (8.1%) and 103 (6.2%) patients who died in the hospital from the public and private data sets, respectively.</p>
          <p>We maintained patients’ first hospitalization data to evaluate the proposed method. Demographic data (age and gender) and the following AMI-related features were maintained in both data sets: AMI-relevant items of laboratory tests that at least 95% of patients carried out, AMI-relevant radiological features extracted from radiology reports [<xref ref-type="bibr" rid="ref34">34</xref>], 7 commonly prescribed medications, and all recorded disease diagnoses and procedures. For laboratory tests performed more than once, only the results obtained in the first test (usually at admission) were retained, which could reflect a patient’s health status and the severity of illness.</p>
          <p>Since initially proposed in the field of natural language processing, the skip-gram algorithm was used to train embeddings for discrete words or symbols. Therefore, to use the skip-gram algorithm for the embedding representation of the structured data, all patient features should be categorical, where each discrete value is treated as a concept. For example, male and female were 2 concepts for gender. Different from raw categorical features, such as gender, disease diagnoses, procedures, and medications, that might remain unchanged, the continuous variables age and laboratory test results had to be discretized into two or more concepts. Age was discretized into 2 concepts (&#62;60 years and ≤60 years). Each laboratory test result was also discretized into 2 concepts (normal and abnormal with reference to clinical standards). In total, 3326 and 1073 medical concepts were identified and further aggregated to 104 and 108 feature groups in the public and private data sets, respectively (<xref ref-type="table" rid="table1">Table 1</xref>). All feature groups of the private and public data sets are listed in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> and <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>, respectively.</p>
          <table-wrap position="float" id="table1">
            <label>Table 1</label>
            <caption>
              <p>Concepts and feature groups of both the public and private data sets.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="160"/>
              <col width="120"/>
              <col width="110"/>
              <col width="0"/>
              <col width="120"/>
              <col width="110"/>
              <col width="0"/>
              <col width="380"/>
              <thead>
                <tr valign="top">
                  <td>Feature category</td>
                  <td colspan="3">Public data set</td>
                  <td colspan="3">Private data set</td>
                  <td>Concept examples</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Feature groups (n=104), n</td>
                  <td>Concepts (n=3326), n</td>
                  <td colspan="2">Feature groups (n=108), n</td>
                  <td>Concepts (n=1073), n</td>
                  <td colspan="2">
                    <break/>
                  </td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>Age</td>
                  <td>1</td>
                  <td>2</td>
                  <td colspan="2">1</td>
                  <td>2</td>
                  <td colspan="2">&#62;60 years and ≤60 years</td>
                </tr>
                <tr valign="top">
                  <td>Gender</td>
                  <td>1</td>
                  <td>2</td>
                  <td colspan="2">1</td>
                  <td>2</td>
                  <td colspan="2">Male and female</td>
                </tr>
                <tr valign="top">
                  <td>Laboratory tests</td>
                  <td>19</td>
                  <td>38</td>
                  <td colspan="2">40</td>
                  <td>80</td>
                  <td colspan="2">Abnormal serum triglyceride and normal serum creatinine</td>
                </tr>
                <tr valign="top">
                  <td>Radiological features</td>
                  <td>34</td>
                  <td>34</td>
                  <td colspan="2">36</td>
                  <td>36</td>
                  <td colspan="2">Cardiac image enlargement and sharp costophrenic angle</td>
                </tr>
                <tr valign="top">
                  <td>Disease diagnoses</td>
                  <td>24</td>
                  <td>2600</td>
                  <td colspan="2">15</td>
                  <td>739</td>
                  <td colspan="2">Hypertension and brainstem infarction</td>
                </tr>
                <tr valign="top">
                  <td>Procedures</td>
                  <td>18</td>
                  <td>643</td>
                  <td colspan="2">8</td>
                  <td>207</td>
                  <td colspan="2">Coronary stenting and pericardiocentesis</td>
                </tr>
                <tr valign="top">
                  <td>Medications</td>
                  <td>7</td>
                  <td>7</td>
                  <td colspan="2">7</td>
                  <td>7</td>
                  <td colspan="2">Angiotensin-converting enzyme inhibitor and heparin</td>
                </tr>
              </tbody>
            </table>
          </table-wrap>
        </sec>
        <sec>
          <title>Representation Evaluation</title>
          <p>To evaluate the effectiveness and advantages of the proposed representation, we used 2 additional kinds of simple reference representation methods, namely, the 3-layer autoencoder with learning and the feature selection method without learning. <xref ref-type="table" rid="table2">Table 2</xref> describes the details of the proposed and reference representation methods.</p>
          <p>The proposed representation method was first evaluated at the concept level. Cluster analyses were used to cluster laboratory test concepts into 2 clusters for the quantitative evaluation. The adjusted Rand index (ARI) [<xref ref-type="bibr" rid="ref35">35</xref>] (ranging from −1 to 1) was used to evaluate the cluster solutions. Greater ARI values indicated higher ability of discriminating from categories with different real labels (normal and abnormal). We also applied the t-distributed stochastic neighbor algorithm to project the embedding vectors of laboratory test concepts into a 2-dimensional space to visually observe the distribution of embeddings.</p>
          <p>The proposed representation method was then evaluated at the patient level with a downstream prediction task using the logistic regression model. The predicted outcome was the in-hospital death of AMI patients during hospital stay. The input for prediction was the patient representation derived from the entire feature set listed in <xref ref-type="table" rid="table1">Table 1</xref>. We also extracted a treatment-free feature subset that excluded medications and procedures from the entire feature set, trying to clarify that the performance of the proposed patient representation was related to the features that were involved in the representation and that the treatment-related features played a crucial role in predicting patient outcome even if they had been represented as embedding vectors.</p>
          <table-wrap position="float" id="table2">
            <label>Table 2</label>
            <caption>
              <p>Descriptions of the proposed and reference representation methods.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="160"/>
              <col width="540"/>
              <col width="300"/>
              <thead>
                <tr valign="top">
                  <td>Representation method</td>
                  <td>Descriptions</td>
                  <td>Representation examples</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>Mixture</td>
                  <td>The mixture of discretization codes for original discrete features and original values for continuous features. The missing values in the laboratory tests were interpolated using the mean of the corresponding laboratory tests.</td>
                  <td>(0,1,1,0,0,0,1,12,8.5,3,8) for a patient with 11 features</td>
                </tr>
                <tr valign="top">
                  <td>Discretization</td>
                  <td>The 0-1 vector where the digit 1 represented the patient having the specific disease, procedure, radiological feature, and medication, and 0 otherwise. Age of 1 meant &#62;60 years and 0 meant ≤60 years, gender of 1 meant male and 0 meant female, and a laboratory test item of 1 meant abnormal and 0 meant normal. Missing values for laboratory tests were interpolated by the corresponding mode.</td>
                  <td>(0,1,1,0,0,0,1,1,0,1,1) for a patient with 11 discretization features</td>
                </tr>
                <tr valign="top">
                  <td>DIS_FS<sup>a</sup></td>
                  <td>The selected features with discretization representations were statistically different between patients with and without the label “death.”</td>
                  <td>(0,0,1,0,0,1,0,1) for a patient with 8 selected features</td>
                </tr>
                <tr valign="top">
                  <td>DIS_AE<sup>b</sup></td>
                  <td>The hidden-layer vector of a 3-layer autoencoder with discretization vectors as inputs and outputs. The dimension of the hidden layer was set to 64.</td>
                  <td>(0.7,1.9,0.5,−1,−3.1,2.4) for a patient with a 6-dimensional vector</td>
                </tr>
                <tr valign="top">
                  <td>RAN_EM_AVE<sup>c</sup></td>
                  <td>The average of feature embedding vectors learned from the skip-gram algorithm using the random selection method to determine the context window.</td>
                  <td>(1.6,−0.5,1.1,0.1,−1.3,0.6) for a patient with a 6-dimensional embedding vector</td>
                </tr>
                <tr valign="top">
                  <td>RAN_EM_WGT<sup>d</sup></td>
                  <td>The weighted sum of the feature embedding vectors learned from the skip-gram algorithm using the random selection method to determine the context window.</td>
                  <td>(1.2,−0.9,1.3,0.4,−1.9,1.0) for a patient with a 6-dimensional embedding vector</td>
                </tr>
                <tr valign="top">
                  <td>ANT_EM_AVE<sup>e</sup></td>
                  <td>The average of the feature embedding vectors learned from the skip-gram algorithm using the confidence with the target concept as the antecedent.</td>
                  <td>(0.9,−0.6,1.2,1.4,−1.9,0.6) for a patient with a 6-dimensional embedding vector</td>
                </tr>
                <tr valign="top">
                  <td>ANT_EM_WGT<sup>f</sup></td>
                  <td>The weighted sum of the feature embedding vectors learned from the skip-gram algorithm using the confidence with the target concept as the antecedent.</td>
                  <td>(1.2,−1.5,1.1,0.1,−0.6,0.6) for a patient with a 6-dimensional embedding vector</td>
                </tr>
                <tr valign="top">
                  <td>CON_EM_AVE<sup>g</sup></td>
                  <td>The average of the feature embedding vectors learned from the skip-gram algorithm using the confidence with the target concept as the consequent.</td>
                  <td>(1.6,−0.8,2.1,1.6,−1.4,1.5) for a patient with a 6-dimensional embedding vector</td>
                </tr>
                <tr valign="top">
                  <td>CON_EM_WGT<sup>h</sup></td>
                  <td>The weighted sum of the feature embedding vectors learned from the skip-gram algorithm using the confidence with the target concept as the consequent.</td>
                  <td>(1.1,−0.4,−0.7,1.6,−0.3,0.9) for a patient with a 6-dimensional embedding vector</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table2fn1">
                <p><sup>a</sup>DIS_FS: discretization representations with feature selection.</p>
              </fn>
              <fn id="table2fn2">
                <p><sup>b</sup>DIS_AE: hidden vector of an autoencoder-based representation.</p>
              </fn>
              <fn id="table2fn3">
                <p><sup>c</sup>RAN_EM_AVE: average of the random selection–based embedding representation.</p>
              </fn>
              <fn id="table2fn4">
                <p><sup>d</sup>RAN_EM_WGT: weighted sum of the random selection–based embedding representation.</p>
              </fn>
              <fn id="table2fn5">
                <p><sup>e</sup>ANT_EM_AVE: average of the antecedent-based embedding representation.</p>
              </fn>
              <fn id="table2fn6">
                <p><sup>f</sup>ANT_EM_WGT: weighted sum of the antecedent-based embedding representation.</p>
              </fn>
              <fn id="table2fn7">
                <p><sup>g</sup>CON_EM_AVE: average of the consequent-based embedding representation.</p>
              </fn>
              <fn id="table2fn8">
                <p><sup>h</sup>CON_EM_WGT: weighted sum of the consequent-based embedding representation.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
          <p>We randomly split samples into training and test data sets by the ratio of 7:3. The training samples were first represented in the discretization vectors and used to build a predictive model for calculating all features’ SHAP values for the further patient embedding representations of all study samples. After being represented as embedding vectors, the training and test samples were used to build and validate a logistic regression-based predictive model, respectively. The area under the receiver operating characteristic curve (AUROC), area under the precision-recall curve (AUPRC), and F1-score were the main evaluation metrics. Other relevant performance metrics from the confusion matrix included precision, recall, and accuracy. To eliminate the performance bias introduced by the initialization of a skip-gram model and the training/test data set split, we performed the comparative experiment 100 times. In each experiment round, the above processes were repeated. The mean with its 95% CI of each performance evaluation metric was reported.</p>
          <p>In the skip-gram algorithm, the size of the context window and the dimension of the embedding vector were determined by trial and error. We conducted a group of predictive experiments on the public data set, using possible combinations of window sizes of 5, 10, 15, and 20, and vector dimensions of 50, 100, 200, and 300. Experimental results (listed in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>) showed that the skip-gram algorithm with the combination of a window size of 10 and a vector dimension of 300 had the highest representation performance. Therefore, the size of the context window and the dimension of the embedding vector were set to 10 and 300, respectively. We applied the negative sampling mechanism (20 negative samples in this study) to accelerate the concept embedding training process. Other parameters were as follows: learning rate, 0.001; number of iterations, 50; batch size, 64. The gradient calculation method was Adam. We implemented representation learning, SHAP value computation, and prediction modeling in Python 3.7 and TensorFlow 2.0. In the step of patient representation, we used the L2 regularization penalty with “liblinear” solver for the logistic regression model, and the inverse of regularization strength was set to 0.1.</p>
        </sec>
      </sec>
      <sec>
        <title>Ethics Approval</title>
        <p>The study was approved by the Human Research Ethics Committees of Xuanwu Hospital, Capital Medical University (approval number: Clinical Scientific Research 2020-070).</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Concept Representation Evaluation</title>
        <p>Embedding vectors for laboratory test concepts were visualized in a plane space (<xref rid="figure3" ref-type="fig">Figure 3</xref>). Concepts of normal and abnormal laboratory tests (<xref rid="figure3" ref-type="fig">Figure 3</xref>) were farther away when they were represented by the consequent-based embeddings (<xref rid="figure3" ref-type="fig">Figures 3</xref>A and 3D) than by the antecedent-based embeddings (<xref rid="figure3" ref-type="fig">Figures 3</xref>B and 3E) and the random selection–based embeddings (<xref rid="figure3" ref-type="fig">Figures 3</xref>C and 3F). In cluster analyses for laboratory tests, the consequent-based embeddings achieved higher ARIs (0.317 and 0.520 on the public and private data sets, respectively) than the antecedent-based embeddings (0.112 and 0.149, respectively) and the random selection–based embeddings (0.043 and 0.028, respectively). The best cluster performance of the consequent-based embeddings among the 3 embeddings indicated that the consequent-based embeddings might contain more feature association information.</p>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Visualization of the embedding laboratory tests using different selection schemes for contextual concepts in the skip-gram algorithm (the t-distributed stochastic neighbor embedding algorithm was used). Dots in red and green represent abnormal and normal laboratory test results, respectively. A to C for the public data set: the contextual concepts of a target concept consist of its consequent concepts (A) or antecedent concepts (B) in association rules, or randomly selected concepts (C). D to F are the counterparts of A to C on the private data set.</p>
          </caption>
          <graphic xlink:href="jmir_v24i8e37486_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Predictive Performance</title>
        <p><xref ref-type="table" rid="table3">Table 3</xref> and <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref> list the predictive performances using various representation methods on the private and public data sets, respectively. The proposed representation method, the weighted sum of the consequent-based embedding representation (CON_EM_WGT), showed the highest predictive performances, with maximum AUROCs of 0.878, 0.973, and 0.926 using all features of the public data set and the entire and treatment-free feature sets of the private data set, respectively. When the performance was measured by AUPRC and F1-score, the proposed representation method outperformed all the other methods regardless of the data sets and feature sets.</p>
        <p>Compared with the reference representations, most of the embedding-based representations on both data sets showed a performance improvement. The average AUROC, AUPRC, and F1-score of the 6 representation methods with embeddings were greater than those of the 4 reference methods without embeddings (0.855 vs 0.831, 0.203 vs 0.185, and 0.354 vs 0.328, respectively) on the public data set with the entire feature set. Further, among the 6 representations based on the skip-gram algorithm, representations with algorithm improvement based on the association strength achieved superior performance than those without.</p>
        <p>When assembling feature representations into a patient representation, the assembling method and the involved features did matter. Representations based on the idea of weighted sum outperformed those based on the idea of average, on either the public data set with the entire feature set (AUROC, 0.863 to 0.878 vs 0.834 to 0.850) or the private data set with the entire feature set (0.967 to 0.973 vs 0.948 to 0.957). On the other hand, consistently superior predictive performance was achieved on both data sets with the entire feature set compared with the treatment-free feature set. <xref ref-type="supplementary-material" rid="app5">Multimedia Appendix 5</xref> shows the average predictive performance of patient representation methods on the public and private data sets with and without treatment feature sets.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Predictive performance of patient representation methods on the private data set.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="30"/>
            <col width="280"/>
            <col width="0"/>
            <col width="220"/>
            <col width="0"/>
            <col width="220"/>
            <col width="0"/>
            <col width="220"/>
            <thead>
              <tr valign="top">
                <td colspan="4">Feature set and representation methods</td>
                <td colspan="2">AUROC<sup>a</sup>, mean (95% CI)</td>
                <td colspan="2">AUPRC<sup>b</sup>, mean (95% CI)</td>
                <td>F1-score, mean (95% CI)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="4">
                  <bold>Entire feature set</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">
                  <bold>Embedding-based representation methods</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>CON_EM_WGT<sup>c</sup></td>
                <td colspan="2">0.973 (0.951-0.995)</td>
                <td colspan="2">0.505 (0.278-0.732)</td>
                <td colspan="2">0.674 (0.468-0.880)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>CON_EM_AVE<sup>d</sup></td>
                <td colspan="2">0.957 (0.933-0.981)</td>
                <td colspan="2">0.312 (0.159-0.465)</td>
                <td colspan="2">0.479 (0.301-0.657)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>ANT_EM_WGT<sup>e</sup></td>
                <td colspan="2">0.972 (0.948-0.996)</td>
                <td colspan="2">0.489 (0.258-0.720)</td>
                <td colspan="2">0.658 (0.442-0.874)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>ANT_EM_AVE<sup>f</sup></td>
                <td colspan="2">0.953 (0.929-0.977)</td>
                <td colspan="2">0.310 (0.185-0.435)</td>
                <td colspan="2">0.478 (0.329-0.627)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>RAN_EM_WGT<sup>g</sup></td>
                <td colspan="2">0.967 (0.942-0.992)</td>
                <td colspan="2">0.486 (0.263-0.709)</td>
                <td colspan="2">0.660 (0.460-0.860)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>RAN_EM_AVE<sup>h</sup></td>
                <td colspan="2">0.948 (0.923-0.973)</td>
                <td colspan="2">0.287 (0.167-0.407)</td>
                <td colspan="2">0.451 (0.306-0.596)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">
                  <bold>Reference representation methods</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>DIS_AE<sup>i</sup></td>
                <td colspan="2">0.884 (0.845-0.923)</td>
                <td colspan="2">0.207 (0.144-0.270)</td>
                <td colspan="2">0.361 (0.279-0.443)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>DIS_FS<sup>j</sup></td>
                <td colspan="2">0.938 (0.907-0.969)</td>
                <td colspan="2">0.283 (0.167-0.399)</td>
                <td colspan="2">0.452 (0.309-0.595)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Discretization</td>
                <td colspan="2">0.939 (0.908-0.970)</td>
                <td colspan="2">0.283 (0.165-0.401)</td>
                <td colspan="2">0.454 (0.307-0.601)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Mixture</td>
                <td colspan="2">0.904 (0.849-0.959)</td>
                <td colspan="2">0.251 (0.135-0.367)</td>
                <td colspan="2">0.417 (0.264-0.570)</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Treatment-free feature set</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">
                  <bold>Embedding-based representation methods</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>CON_EM_WGT</td>
                <td colspan="2">0.926 (0.883-0.969)</td>
                <td colspan="2">0.282 (0.139-0.425)</td>
                <td colspan="2">0.456 (0.282-0.630)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>CON_EM_AVE</td>
                <td colspan="2">0.915 (0.876-0.954)</td>
                <td colspan="2">0.248 (0.156-0.340)</td>
                <td colspan="2">0.413 (0.297-0.529)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>ANT_EM_WGT</td>
                <td colspan="2">0.919 (0.874-0.964)</td>
                <td colspan="2">0.278 (0.133-0.423)</td>
                <td colspan="2">0.455 (0.275-0.635)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>ANT_EM_AVE</td>
                <td colspan="2">0.912 (0.869-0.955)</td>
                <td colspan="2">0.256 (0.162-0.350)</td>
                <td colspan="2">0.423 (0.307-0.539)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>RAN_EM_WGT</td>
                <td colspan="2">0.915 (0.868-0.962)</td>
                <td colspan="2">0.248 (0.119-0.377)</td>
                <td colspan="2">0.416 (0.238-0.594)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>RAN_EM_AVE</td>
                <td colspan="2">0.897 (0.850-0.944)</td>
                <td colspan="2">0.225 (0.133-0.317)</td>
                <td colspan="2">0.385 (0.265-0.505)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">
                  <bold>Reference representation methods</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>DIS_AE</td>
                <td colspan="2">0.884 (0.845-0.923)</td>
                <td colspan="2">0.207 (0.144-0.270)</td>
                <td colspan="2">0.361 (0.279-0.443)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>DIS_FS</td>
                <td colspan="2">0.903 (0.862-0.944)</td>
                <td colspan="2">0.214 (0.124-0.304)</td>
                <td colspan="2">0.367 (0.236-0.498)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Discretization</td>
                <td colspan="2">0.905 (0.862-0.948)</td>
                <td colspan="2">0.224 (0.122-0.326)</td>
                <td colspan="2">0.381 (0.238-0.524)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Mixture</td>
                <td colspan="2">0.867 (0.806-0.928)</td>
                <td colspan="2">0.202 (0.116-0.288)</td>
                <td colspan="2">0.356 (0.227-0.485)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>AUROC: area under the receiver operating characteristic curve.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>AUPRC: area under the precision-recall curve.</p>
            </fn>
            <fn id="table3fn3">
              <p><sup>c</sup>CON_EM_WGT: weighted sum of the consequent-based embedding representation.</p>
            </fn>
            <fn id="table3fn4">
              <p><sup>d</sup>CON_EM_AVE: average of the consequent-based embedding representation.</p>
            </fn>
            <fn id="table3fn5">
              <p><sup>e</sup>ANT_EM_WGT: weighted sum of the antecedent-based embedding representation.</p>
            </fn>
            <fn id="table3fn6">
              <p><sup>f</sup>ANT_EM_AVE: average of the antecedent-based embedding representation.</p>
            </fn>
            <fn id="table3fn7">
              <p><sup>g</sup>RAN_EM_WGT: weighted sum of the random selection–based embedding representation.</p>
            </fn>
            <fn id="table3fn8">
              <p><sup>h</sup>RAN_EM_AVE: average of the random selection–based embedding representation.</p>
            </fn>
            <fn id="table3fn9">
              <p><sup>i</sup>DIS_AE: discretization representations with features selection.</p>
            </fn>
            <fn id="table3fn10">
              <p><sup>j</sup>DIS_FS: hidden vector of an autoencoder-based representation.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Predictive Model Interpretation</title>
        <p><xref rid="figure4" ref-type="fig">Figure 4</xref> illustrates the global feature attributions for the top 20 most important features from the private data set when predicting in-hospital death risk. The treatment-related features played an important role in the mortality prediction. These features included other surgery (mean absolute SHAP value: 0.413), diagnostic ultrasound (0.279), contrast agent cardiovascular angiography (0.197), etc (<xref rid="figure4" ref-type="fig">Figure 4</xref>A). Moreover, comorbidity diseases like hypertension (mean absolute SHAP value: 0.252) and heart disease complications (0.236), and laboratory tests like serum glucose (0.188) and serum lactate dehydrogenase (0.139) had strong associations with in-hospital death (<xref rid="figure4" ref-type="fig">Figure 4</xref>B). SHAP values of features in the public data set are shown in <xref ref-type="supplementary-material" rid="app6">Multimedia Appendix 6</xref>.</p>
        <p>In addition to the feature’s global importance in the specific predictive task, SHAP values were helpful in distinguishing the feature’s local importance, that is, the importance for an individual sample. <xref rid="figure5" ref-type="fig">Figure 5</xref> illustrates how the mortality risk was predicted with SHAP values for a patient who died during hospital stay and another patient who did not die. The positive SHAP values of most features of the patient who died during hospital stay increased the total SHAP value from an average value of −3.739 to a final value of −0.499 (<xref rid="figure5" ref-type="fig">Figures 5</xref>A and 5C), meaning that the patient had a higher risk of in-hospital death than the average. In this incremental process, gender as female, for example, contributed a SHAP value of +0.21 (<xref rid="figure5" ref-type="fig">Figures 5</xref>C). On the contrary, the negative SHAP values of most features of the patient who was discharged alive decreased the total SHAP value from −3.739 to −6.169 (<xref rid="figure5" ref-type="fig">Figures 5</xref>B and 5D), indicating a lower death risk. In this decremental process, male gender contributed a SHAP value of −0.09 (<xref rid="figure5" ref-type="fig">Figures 5</xref>D). We have shown 2 examples of patients from the public data set in <xref ref-type="supplementary-material" rid="app7">Multimedia Appendix 7</xref>.</p>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>The mean absolute Shapley additive explanations (SHAP) values of the top 20 features of the private data set within the entire feature set (A) and the treatment-free feature set (B).</p>
          </caption>
          <graphic xlink:href="jmir_v24i8e37486_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>Shapley additive explanations (SHAP) values for a patient who died during hospital stay (A and C) and another patient who did not die (B and D). Both patients were selected from the private data set with the entire feature set. A and B, all features with their SHAP values. C and D, 20 features with the greatest absolute SHAP values. Features in blue tend to reduce the possibility of a patient being classified as positive (death in this study), while features in red do the contrary. The meaning of each abbreviated feature name can be found in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p>
          </caption>
          <graphic xlink:href="jmir_v24i8e37486_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>With the widespread adoption of EMR data in building machine learning–based predictive models, one of the most fundamental research challenges was learning proper patient representations that might capture hidden semantic associations among medical concepts [<xref ref-type="bibr" rid="ref18">18</xref>]. In this study, we proposed an improved skip-gram–based patient representation method where the association strength among medical concepts and the task-specific feature importance were integrated. Compared with other representation methods, the proposed patient representation improved the performance of the mortality risk prediction for AMI patients.</p>
        <p>In previous studies, deep learning models [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref36">36</xref>] were used in training embedding representations of medical concepts for the subsequent patient representation. When using the skip-gram algorithm, the order of medical concepts that was independent of feature relevance hindered the algorithm from learning high-quality representation. Prior work recommended the shuffling mechanism for medical concepts in a patient record to reduce the impact of the out-of-order characteristics on the algorithm [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref24">24</xref>-<xref ref-type="bibr" rid="ref26">26</xref>]. In this study, we introduced the association strength between 2 concepts that was defined as the confidence of an association rule involving just the 2 concepts. Experiments from various aspects indicated that this ingenious improvement was effective in revealing potential associations among medical concepts and further enhancing the performance of downstream prediction tasks.</p>
        <p>In addition to the representation algorithm, features used to represent a patient were also critical. Many previous studies focused on some features in the original form of medical codes, such as disease diagnoses, procedures, and medications [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref37">37</xref>]. For laboratory tests that contained much diagnosis and prognosis-relevant information about patients, we included the normal status of the laboratory tests into the feature sets, rather than simply using the number of laboratory tests and test co-occurrences [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref38">38</xref>]. We further extracted radiological features from free-text radiological reports. Admittedly, richer features may lead to a feature representation with more information, even if the dimension of patient representation remains unchanged. In this study, predictive models using more features to represent a patient did reflect more information about the patient and showed higher performance than those using fewer features. Our finding is similar to the results of other studies [<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref40">40</xref>].</p>
        <p>Prior studies employed neural networks to train predictive models for clinical outcomes using EMR data [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref22">22</xref>]. They focused on end-to-end prediction models built on large data sets, where the last hidden layer of the neural network was regarded as the patient representation. Although the deep end-to-end neural network–based patient representation improved the predictive accuracy, the lack of interpretability could not be ignored. Some studies [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref41">41</xref>] constructed patient representations using the average of concept representations learned by word embedding methods, which did not make full use of the importance of different clinical features for patients. As an advanced interpretability method, the SHAP value [<xref ref-type="bibr" rid="ref32">32</xref>] was successfully used to analyze and explain the predictive models in some previous studies [<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref42">42</xref>-<xref ref-type="bibr" rid="ref44">44</xref>]. We introduced SHAP values as feature importance into the patient representation, and further explained the predictive model with SHAP values. SHAP values can be used to not only rank the overall importance and identify the important factors for the prediction task, but also explore the key factors for predicting the mortality risk for a specific patient. In our predictive task for AMI patients, the most important features identified by SHAP values were really closely related to AMI [<xref ref-type="bibr" rid="ref45">45</xref>-<xref ref-type="bibr" rid="ref47">47</xref>], such as serum glucose and serum creatine kinase, which are 2 critical laboratory tests for AMI diagnosis and prognosis in clinical practice.</p>
        <p>In our predictive task, the model that took all available patient characteristics represented by the proposed patient representation method as inputs showed a higher performance than other models on the same task in previous studies (AUROC, 0.973 vs 0.905 to 0.935 [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref29">29</xref>-<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref48">48</xref>]). This may be because the embedding representation contained a large number of diverse features extracted from a general EMR system, while many researchers selected AMI-related features with the assistance of clinical experts. For example, basic demographic data and few laboratory tests, as well as several specific features of AMI like Killip classification and left ventricular ejection fraction [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref30">30</xref>] were directly added into the machine learning model to predict mortality risk. Further, compared with other simple feature extraction methods like Principal Component Analysis [<xref ref-type="bibr" rid="ref29">29</xref>] and the 3-layer autoencoder model, the proposed method took the association strength and feature importance into consideration, achieving higher predictive performance.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>This study had some limitations. First, only patients’ laboratory tests for the first time during hospital stay were included in this study, while many patients took two or more laboratory tests. Since temporal data, especially multiple laboratory tests, may reflect the dynamic health status and the treatment effect of a patient over time, the lack of temporal characteristics of laboratory tests in the patient representation may lead to performance loss in downstream tasks. A future study will focus on integrating this uneven and irregular temporal data into the current patient representation. Second, the skip-gram algorithm was used in training concept embeddings. The algorithm is popular in the natural language processing domain, possibly having a limited ability to represent structured and disordered EMR data. A transformer-based pretrain model, Med-Bert, has been trained to represent disease diagnoses originally expressed in ICD-10 and ICD-9 codes, showing higher performance with AUROCs of 85.39% and 82.23% in heart failure and pancreatic cancer prediction tasks, respectively [<xref ref-type="bibr" rid="ref49">49</xref>]. Therefore, more complicated deep learning methods will be adopted for a more informative patient representation in the future. Lastly, we carried out only internal validation of the predictive model built on the proposed patient representation. External validation of high quality will be more convincing and will help in continuous algorithm improvement. Moreover, the chosen reference methods for the performance comparison were simple feature selection methods and a 3-layer autoencoder. Comparison with state-of-the-art methods is needed to evaluate the performance and potential use of our proposed method.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>In this study, we improved the embedding-based patient representation with the association strength of medical concepts and importance of patient features. After further training and fine-tuning, the model based on the proposed patient representation will hopefully be used to assist in prognostic prediction for AMI inpatients. This study puts forward a meaningful direction for the development of more effective and efficient clinical prediction models using EMR data. It is desirable for patient representation learning to serve as an essential part of building a predictive model for clinical outcomes.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Patient features of samples in the private data set.</p>
        <media xlink:href="jmir_v24i8e37486_app1.docx" xlink:title="DOCX File , 35 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Patient features of samples in the public MIMIC-III data set.</p>
        <media xlink:href="jmir_v24i8e37486_app2.docx" xlink:title="DOCX File , 34 KB"/>
      </supplementary-material>
      <supplementary-material id="app3">
        <label>Multimedia Appendix 3</label>
        <p>Predictive performance of skip-gram–based embedding representations with different combinations of the size of the context window and the dimension of the embedding vector.</p>
        <media xlink:href="jmir_v24i8e37486_app3.docx" xlink:title="DOCX File , 24 KB"/>
      </supplementary-material>
      <supplementary-material id="app4">
        <label>Multimedia Appendix 4</label>
        <p>Predictive performance of patient representation methods on the public data set.</p>
        <media xlink:href="jmir_v24i8e37486_app4.docx" xlink:title="DOCX File , 21 KB"/>
      </supplementary-material>
      <supplementary-material id="app5">
        <label>Multimedia Appendix 5</label>
        <p>The average predictive performance of patient representation methods on the public and private data sets with and without treatment feature sets.</p>
        <media xlink:href="jmir_v24i8e37486_app5.docx" xlink:title="DOCX File , 22 KB"/>
      </supplementary-material>
      <supplementary-material id="app6">
        <label>Multimedia Appendix 6</label>
        <p>The mean absolute Shapley additive explanations (SHAP) values of the top 20 features of the public data set within the entire feature set (A) and the treatment-free feature set (B).</p>
        <media xlink:href="jmir_v24i8e37486_app6.docx" xlink:title="DOCX File , 356 KB"/>
      </supplementary-material>
      <supplementary-material id="app7">
        <label>Multimedia Appendix 7</label>
        <p>Shapley additive explanations (SHAP) values for a patient who died during hospital stay (A and C) and another patient who did not die (B and D) from the public data set with the entire feature set.</p>
        <media xlink:href="jmir_v24i8e37486_app7.docx" xlink:title="DOCX File , 394 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AMI</term>
          <def>
            <p>acute myocardial infarction</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">ARI</term>
          <def>
            <p>adjusted Rand index</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">AUPRC</term>
          <def>
            <p>area under the precision-recall curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">AUROC</term>
          <def>
            <p>area under the receiver operating characteristic curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">EMR</term>
          <def>
            <p>electronic medical record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">ICD</term>
          <def>
            <p>International Classification of Diseases</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">SHAP</term>
          <def>
            <p>Shapley additive explanations</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This work was supported by the National Natural Science Foundation of China (No. 81971707).</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xiao</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Pan</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Jing</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Yuan</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Treatment initiation prediction by EHR mapped PPD tensor based convolutional neural networks boosting algorithm</article-title>
          <source>J Biomed Inform</source>
          <year>2021</year>
          <month>08</month>
          <volume>120</volume>
          <fpage>103840</fpage>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2021.103840</pub-id>
          <pub-id pub-id-type="medline">34139331</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(21)00169-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Long-term prediction for temporal propagation of seasonal influenza using Transformer-based model</article-title>
          <source>J Biomed Inform</source>
          <year>2021</year>
          <month>10</month>
          <volume>122</volume>
          <fpage>103894</fpage>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2021.103894</pub-id>
          <pub-id pub-id-type="medline">34454080</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(21)00223-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Sheng</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hou</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>A novel hierarchical machine learning model for hospital-acquired venous thromboembolism risk assessment among multiple-departments</article-title>
          <source>J Biomed Inform</source>
          <year>2021</year>
          <month>10</month>
          <volume>122</volume>
          <fpage>103892</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(21)00221-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2021.103892</pub-id>
          <pub-id pub-id-type="medline">34454079</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(21)00221-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Ng</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Sow</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Mei</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Disease network delineates the disease progression profile of cardiovascular diseases</article-title>
          <source>J Biomed Inform</source>
          <year>2021</year>
          <month>03</month>
          <volume>115</volume>
          <fpage>103686</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(21)00015-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2021.103686</pub-id>
          <pub-id pub-id-type="medline">33493631</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(21)00015-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Dong</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Kaymak</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Deep representation learning for individualized treatment effect estimation using electronic health records</article-title>
          <source>J Biomed Inform</source>
          <year>2019</year>
          <month>12</month>
          <volume>100</volume>
          <fpage>103303</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(19)30222-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2019.103303</pub-id>
          <pub-id pub-id-type="medline">31610264</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(19)30222-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dligach</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Afshar</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Toward a clinical text encoder: pretraining for clinical natural language processing with applications to substance misuse</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2019</year>
          <month>11</month>
          <day>01</day>
          <volume>26</volume>
          <issue>11</issue>
          <fpage>1272</fpage>
          <lpage>1278</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31233140"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocz072</pub-id>
          <pub-id pub-id-type="medline">31233140</pub-id>
          <pub-id pub-id-type="pii">5522436</pub-id>
          <pub-id pub-id-type="pmcid">PMC6798566</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kamal</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Yin</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Qian</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>An interpretable risk prediction model for healthcare with pattern attention</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2020</year>
          <month>12</month>
          <day>30</day>
          <volume>20</volume>
          <issue>Suppl 11</issue>
          <fpage>307</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-020-01331-7"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-020-01331-7</pub-id>
          <pub-id pub-id-type="medline">33380322</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-020-01331-7</pub-id>
          <pub-id pub-id-type="pmcid">PMC7772928</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Chou</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Xiao</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Sarva</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Henchcliffe</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Data-driven subtyping of Parkinson's disease using longitudinal clinical records: A cohort study</article-title>
          <source>Sci Rep</source>
          <year>2019</year>
          <month>01</month>
          <day>28</day>
          <volume>9</volume>
          <issue>1</issue>
          <fpage>797</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-018-37545-z"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-018-37545-z</pub-id>
          <pub-id pub-id-type="medline">30692568</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-018-37545-z</pub-id>
          <pub-id pub-id-type="pmcid">PMC6349906</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Gandhi</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Shao</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Han</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Chandrasekaran</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Turzhitsky</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Bali</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>Metzger</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Baker</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>La Rosa</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Weaver</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dexter</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Applying interpretable deep learning models to identify chronic cough patients using EHR data</article-title>
          <source>Comput Methods Programs Biomed</source>
          <year>2021</year>
          <month>10</month>
          <volume>210</volume>
          <fpage>106395</fpage>
          <pub-id pub-id-type="doi">10.1016/j.cmpb.2021.106395</pub-id>
          <pub-id pub-id-type="medline">34525412</pub-id>
          <pub-id pub-id-type="pii">S0169-2607(21)00469-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Long</surname>
              <given-names>Q</given-names>
            </name>
          </person-group>
          <article-title>Distributed learning from multiple EHR databases: Contextual embedding models for medical events</article-title>
          <source>J Biomed Inform</source>
          <year>2019</year>
          <month>04</month>
          <volume>92</volume>
          <fpage>103138</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(19)30056-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2019.103138</pub-id>
          <pub-id pub-id-type="medline">30825539</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(19)30056-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC6533615</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Barbieri</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kemp</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Perez-Concha</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Kotwal</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Gallagher</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ritchie</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Jorm</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Benchmarking deep learning architectures for predicting readmission to the ICU and describing patients-at-risk</article-title>
          <source>Sci Rep</source>
          <year>2020</year>
          <month>01</month>
          <day>24</day>
          <volume>10</volume>
          <issue>1</issue>
          <fpage>1111</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-020-58053-z"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-020-58053-z</pub-id>
          <pub-id pub-id-type="medline">31980704</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-020-58053-z</pub-id>
          <pub-id pub-id-type="pmcid">PMC6981230</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Steinberg</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Jung</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Fries</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Corbin</surname>
              <given-names>CK</given-names>
            </name>
            <name name-style="western">
              <surname>Pfohl</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>NH</given-names>
            </name>
          </person-group>
          <article-title>Language models are an effective representation learning technique for electronic health record data</article-title>
          <source>J Biomed Inform</source>
          <year>2021</year>
          <month>01</month>
          <volume>113</volume>
          <fpage>103637</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(20)30265-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2020.103637</pub-id>
          <pub-id pub-id-type="medline">33290879</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(20)30265-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC7863633</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Carrasco-Ribelles</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Pardo-Mas</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Tortajada</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sáez</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Valdivieso</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>García-Gómez</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>Predicting morbidity by local similarities in multi-scale patient trajectories</article-title>
          <source>J Biomed Inform</source>
          <year>2021</year>
          <month>08</month>
          <volume>120</volume>
          <fpage>103837</fpage>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2021.103837</pub-id>
          <pub-id pub-id-type="medline">34119690</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(21)00166-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Ji</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Multi-layer representation learning and its application to electronic health records</article-title>
          <source>Neural Process Lett</source>
          <year>2021</year>
          <volume>53</volume>
          <issue>2</issue>
          <fpage>1417</fpage>
          <lpage>1433</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/33623481"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s11063-021-10449-2</pub-id>
          <pub-id pub-id-type="medline">33623481</pub-id>
          <pub-id pub-id-type="pii">10449</pub-id>
          <pub-id pub-id-type="pmcid">PMC7891814</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Yin</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Weight-based multiple empirical kernel learning with neighbor discriminant constraint for heart failure mortality prediction</article-title>
          <source>J Biomed Inform</source>
          <year>2020</year>
          <month>01</month>
          <volume>101</volume>
          <fpage>103340</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(19)30259-X"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2019.103340</pub-id>
          <pub-id pub-id-type="medline">31756495</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(19)30259-X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rongali</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Rose</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>McManus</surname>
              <given-names>DD</given-names>
            </name>
            <name name-style="western">
              <surname>Bajracharya</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Kapoor</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Granillo</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Learning latent space representations to predict patient outcomes: Model development and validation</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <month>03</month>
          <day>23</day>
          <volume>22</volume>
          <issue>3</issue>
          <fpage>e16374</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/3/e16374/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/16374</pub-id>
          <pub-id pub-id-type="medline">32202503</pub-id>
          <pub-id pub-id-type="pii">v22i3e16374</pub-id>
          <pub-id pub-id-type="pmcid">PMC7136840</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tahayori</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Chini-Foroush</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Akhlaghi</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Advanced natural language processing technique to predict patient disposition based on emergency triage notes</article-title>
          <source>Emerg Med Australas</source>
          <year>2021</year>
          <volume>33</volume>
          <issue>3</issue>
          <fpage>480</fpage>
          <lpage>484</lpage>
          <pub-id pub-id-type="doi">10.1111/1742-6723.13656</pub-id>
          <pub-id pub-id-type="medline">33043570</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Si</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Du</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Jim Zheng</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Deep representation learning of patient data from Electronic Health Records (EHR): A systematic review</article-title>
          <source>J Biomed Inform</source>
          <year>2021</year>
          <month>03</month>
          <volume>115</volume>
          <fpage>103671</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(20)30299-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2020.103671</pub-id>
          <pub-id pub-id-type="medline">33387683</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(20)30299-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kwon</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jeon</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>HM</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Lim</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Song</surname>
              <given-names>PS</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Choi</surname>
              <given-names>RK</given-names>
            </name>
            <name name-style="western">
              <surname>Oh</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Deep-learning-based risk stratification for mortality of patients with acute myocardial infarction</article-title>
          <source>PLoS One</source>
          <year>2019</year>
          <volume>14</volume>
          <issue>10</issue>
          <fpage>e0224502</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0224502"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0224502</pub-id>
          <pub-id pub-id-type="medline">31671144</pub-id>
          <pub-id pub-id-type="pii">PONE-D-19-14012</pub-id>
          <pub-id pub-id-type="pmcid">PMC6822714</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ruan</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Lei</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhai</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Representation learning for clinical time series prediction tasks in electronic health records</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2019</year>
          <month>12</month>
          <day>17</day>
          <volume>19</volume>
          <issue>Suppl 8</issue>
          <fpage>259</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-019-0985-7"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-019-0985-7</pub-id>
          <pub-id pub-id-type="medline">31842854</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-019-0985-7</pub-id>
          <pub-id pub-id-type="pmcid">PMC6916209</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Papapetrou</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Asker</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Boström</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Learning from heterogeneous temporal data in electronic health records</article-title>
          <source>J Biomed Inform</source>
          <year>2017</year>
          <month>01</month>
          <volume>65</volume>
          <fpage>105</fpage>
          <lpage>119</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(16)30165-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2016.11.006</pub-id>
          <pub-id pub-id-type="medline">27919732</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(16)30165-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Morid</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Sheng</surname>
              <given-names>ORL</given-names>
            </name>
            <name name-style="western">
              <surname>Kawamoto</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Abdelrahman</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Learning hidden patterns from patient multivariate time series data using convolutional neural networks: A case study of healthcare cost prediction</article-title>
          <source>J Biomed Inform</source>
          <year>2020</year>
          <month>11</month>
          <volume>111</volume>
          <fpage>103565</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(20)30193-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2020.103565</pub-id>
          <pub-id pub-id-type="medline">32980530</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(20)30193-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mikolov</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Sutskever</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Corrado</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Dean</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Distributed representations of words and phrases and their compositionality</article-title>
          <source>NIPS'13: Proceedings of the 26th International Conference on Neural Information Processing Systems - Volume 2</source>
          <year>2013</year>
          <conf-name>26th International Conference on Neural Information Processing Systems</conf-name>
          <conf-date>December 5-10, 2013</conf-date>
          <conf-loc>Lake Tahoe, Nevada</conf-loc>
          <fpage>3111</fpage>
          <lpage>3119</lpage>
          <pub-id pub-id-type="doi">10.5555/2999792.2999959</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Glicksberg</surname>
              <given-names>BS</given-names>
            </name>
            <name name-style="western">
              <surname>Miotto</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>KW</given-names>
            </name>
            <name name-style="western">
              <surname>Shameer</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Dudley</surname>
              <given-names>JT</given-names>
            </name>
          </person-group>
          <article-title>Automated disease cohort selection using word embeddings from Electronic Health Records</article-title>
          <source>Pac Symp Biocomput</source>
          <year>2018</year>
          <volume>23</volume>
          <fpage>145</fpage>
          <lpage>156</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://psb.stanford.edu/psb-online/proceedings/psb18/abstracts/2018_p145.html"/>
          </comment>
          <pub-id pub-id-type="medline">29218877</pub-id>
          <pub-id pub-id-type="pii">9789813235533_0014</pub-id>
          <pub-id pub-id-type="pmcid">PMC5788312</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cui</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Prediction task guided representation learning of medical codes in EHR</article-title>
          <source>J Biomed Inform</source>
          <year>2018</year>
          <month>08</month>
          <volume>84</volume>
          <fpage>1</fpage>
          <lpage>10</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(18)30119-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2018.06.013</pub-id>
          <pub-id pub-id-type="medline">29928997</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(18)30119-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Fei</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Patient representation from structured electronic medical records based on embedding technique: Development and validation study</article-title>
          <source>JMIR Med Inform</source>
          <year>2021</year>
          <month>07</month>
          <day>23</day>
          <volume>9</volume>
          <issue>7</issue>
          <fpage>e19905</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2021/7/e19905/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/19905</pub-id>
          <pub-id pub-id-type="medline">34297000</pub-id>
          <pub-id pub-id-type="pii">v9i7e19905</pub-id>
          <pub-id pub-id-type="pmcid">PMC8367145</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Shi</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Xue</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Dong</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Meng</surname>
              <given-names>Q</given-names>
            </name>
          </person-group>
          <article-title>Geographic variations in in‐hospital mortality and use of percutaneous coronary intervention following acute myocardial infarction in China: A nationwide cross‐sectional analysis</article-title>
          <source>J Am Heart Assoc</source>
          <year>2018</year>
          <month>04</month>
          <day>17</day>
          <volume>7</volume>
          <issue>8</issue>
          <fpage>52</fpage>
          <lpage>62</lpage>
          <pub-id pub-id-type="doi">10.1161/JAHA.117.008131</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <collab>GBD 2013 Mortality Causes of Death Collaborators</collab>
          </person-group>
          <article-title>Global, regional, and national age–sex specific all-cause and cause-specific mortality for 240 causes of death, 1990–2013: a systematic analysis for the Global Burden of Disease Study 2013</article-title>
          <source>The Lancet</source>
          <year>2015</year>
          <month>01</month>
          <day>10</day>
          <volume>385</volume>
          <issue>9963</issue>
          <fpage>117</fpage>
          <lpage>171</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25530442"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S0140-6736(14)61682-2</pub-id>
          <pub-id pub-id-type="medline">25530442</pub-id>
          <pub-id pub-id-type="pii">S0140-6736(14)61682-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC4340604</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>HC</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Choe</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Ahn</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>HW</given-names>
            </name>
            <name name-style="western">
              <surname>Oh</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Choi</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Cha</surname>
              <given-names>KS</given-names>
            </name>
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>TJ</given-names>
            </name>
            <name name-style="western">
              <surname>Jeong</surname>
              <given-names>MH</given-names>
            </name>
            <collab>Korea Acute Myocardial Infarction Registry (KAMIR) Korea Working Group on Myocardial Infarction (KorMI) Investigators</collab>
          </person-group>
          <article-title>Prediction of 1-year mortality from acute myocardial infarction using machine learning</article-title>
          <source>Am J Cardiol</source>
          <year>2020</year>
          <month>10</month>
          <day>15</day>
          <volume>133</volume>
          <fpage>23</fpage>
          <lpage>31</lpage>
          <pub-id pub-id-type="doi">10.1016/j.amjcard.2020.07.048</pub-id>
          <pub-id pub-id-type="medline">32811651</pub-id>
          <pub-id pub-id-type="pii">S0002-9149(20)30783-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Aziz</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Malek</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ibrahim</surname>
              <given-names>KS</given-names>
            </name>
            <name name-style="western">
              <surname>Raja Shariff</surname>
              <given-names>RE</given-names>
            </name>
            <name name-style="western">
              <surname>Wan Ahmad</surname>
              <given-names>WA</given-names>
            </name>
            <name name-style="western">
              <surname>Ali</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>KT</given-names>
            </name>
            <name name-style="western">
              <surname>Selvaraj</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Kasim</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Short- and long-term mortality prediction after an acute ST-elevation myocardial infarction (STEMI) in Asians: A machine learning approach</article-title>
          <source>PLoS One</source>
          <year>2021</year>
          <volume>16</volume>
          <issue>8</issue>
          <fpage>e0254894</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0254894"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0254894</pub-id>
          <pub-id pub-id-type="medline">34339432</pub-id>
          <pub-id pub-id-type="pii">PONE-D-21-01510</pub-id>
          <pub-id pub-id-type="pmcid">PMC8328310</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Qian</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Ji</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Nomograms based on pre-operative parametric for prediction of short-term mortality in acute myocardial infarction patients treated invasively</article-title>
          <source>Aging (Albany NY)</source>
          <year>2020</year>
          <month>12</month>
          <day>11</day>
          <volume>13</volume>
          <issue>2</issue>
          <fpage>2184</fpage>
          <lpage>2197</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.impactaging.com/full/13/2184"/>
          </comment>
          <pub-id pub-id-type="doi">10.18632/aging.202230</pub-id>
          <pub-id pub-id-type="medline">33323557</pub-id>
          <pub-id pub-id-type="pii">202230</pub-id>
          <pub-id pub-id-type="pmcid">PMC7880403</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lundberg</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>SI</given-names>
            </name>
          </person-group>
          <article-title>A unified approach to interpreting model predictions</article-title>
          <source>NIPS'17: Proceedings of the 31st International Conference on Neural Information Processing Systems</source>
          <year>2017</year>
          <conf-name>31st International Conference on Neural Information Processing Systems</conf-name>
          <conf-date>December 4-9, 2017</conf-date>
          <conf-loc>Long Beach, California</conf-loc>
          <fpage>4768</fpage>
          <lpage>4777</lpage>
          <pub-id pub-id-type="doi">10.5555/3295222</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="web">
          <source>Medical Information Mart for Intensive Care</source>
          <access-date>2022-07-23</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mimic.mit.edu/">https://mimic.mit.edu/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Fei</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Sequential data-based patient similarity framework for patient outcome prediction: Algorithm development</article-title>
          <source>J Med Internet Res</source>
          <year>2022</year>
          <month>01</month>
          <day>06</day>
          <volume>24</volume>
          <issue>1</issue>
          <fpage>e30720</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2022/1/e30720/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/30720</pub-id>
          <pub-id pub-id-type="medline">34989682</pub-id>
          <pub-id pub-id-type="pii">v24i1e30720</pub-id>
          <pub-id pub-id-type="pmcid">PMC8778569</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Grant</surname>
              <given-names>PW</given-names>
            </name>
          </person-group>
          <article-title>Robust clustering by detecting density peaks and assigning points based on fuzzy weighted K-nearest neighbors</article-title>
          <source>Information Sciences</source>
          <year>2016</year>
          <month>08</month>
          <volume>354</volume>
          <fpage>19</fpage>
          <lpage>40</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ins.2016.03.011</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Bai</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>EHR2Vec: Representation learning of medical concepts from temporal patterns of clinical notes based on self-attention mechanism</article-title>
          <source>Front Genet</source>
          <year>2020</year>
          <volume>11</volume>
          <fpage>630</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.3389/fgene.2020.00630"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fgene.2020.00630</pub-id>
          <pub-id pub-id-type="medline">32714371</pub-id>
          <pub-id pub-id-type="pmcid">PMC7344186</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bai</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Chanda</surname>
              <given-names>AK</given-names>
            </name>
            <name name-style="western">
              <surname>Egleston</surname>
              <given-names>BL</given-names>
            </name>
            <name name-style="western">
              <surname>Vucetic</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>EHR phenotyping via jointly embedding medical concepts and words into a unified vector space</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2018</year>
          <month>12</month>
          <day>12</day>
          <volume>18</volume>
          <issue>Suppl 4</issue>
          <fpage>123</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-018-0672-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-018-0672-0</pub-id>
          <pub-id pub-id-type="medline">30537974</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-018-0672-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC6290514</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Miotto</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Kidd</surname>
              <given-names>BA</given-names>
            </name>
            <name name-style="western">
              <surname>Dudley</surname>
              <given-names>JT</given-names>
            </name>
          </person-group>
          <article-title>Deep patient: An unsupervised representation to predict the future of patients from the electronic health records</article-title>
          <source>Sci Rep</source>
          <year>2016</year>
          <month>05</month>
          <day>17</day>
          <volume>6</volume>
          <fpage>26094</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/srep26094"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/srep26094</pub-id>
          <pub-id pub-id-type="medline">27185194</pub-id>
          <pub-id pub-id-type="pii">srep26094</pub-id>
          <pub-id pub-id-type="pmcid">PMC4869115</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Yin</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Yuan</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Combining structured and unstructured data for predictive models: a deep learning approach</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2020</year>
          <month>10</month>
          <day>29</day>
          <volume>20</volume>
          <issue>1</issue>
          <fpage>280</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-020-01297-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-020-01297-6</pub-id>
          <pub-id pub-id-type="medline">33121479</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-020-01297-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC7596962</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Pan</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Mao</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Explainable dynamic multimodal variational autoencoder for the prediction of patients with suspected central precocious puberty</article-title>
          <source>IEEE J. Biomed. Health Inform</source>
          <year>2022</year>
          <month>3</month>
          <volume>26</volume>
          <issue>3</issue>
          <fpage>1362</fpage>
          <lpage>1373</lpage>
          <pub-id pub-id-type="doi">10.1109/jbhi.2021.3103271</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Choi</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Schuetz</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Stewart</surname>
              <given-names>WF</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Medical concept representation learning from electronic health records and its application on heart failure prediction</article-title>
          <source>arXiv</source>
          <year>2016</year>
          <access-date>2022-07-19</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1602.03686">https://arxiv.org/abs/1602.03686</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Müller</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gromicho</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>de Carvalho</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Madeira</surname>
              <given-names>SC</given-names>
            </name>
          </person-group>
          <article-title>Explainable models of disease progression in ALS: Learning from longitudinal clinical data with recurrent neural networks and deep model explanation</article-title>
          <source>Computer Methods and Programs in Biomedicine Update</source>
          <year>2021</year>
          <volume>1</volume>
          <fpage>100018</fpage>
          <pub-id pub-id-type="doi">10.1016/j.cmpbup.2021.100018</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lundberg</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Erion</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>DeGrave</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Prutkin</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Nair</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Katz</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Himmelfarb</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bansal</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>From local explanations to global understanding with explainable AI for trees</article-title>
          <source>Nat Mach Intell</source>
          <year>2020</year>
          <month>01</month>
          <volume>2</volume>
          <issue>1</issue>
          <fpage>56</fpage>
          <lpage>67</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32607472"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s42256-019-0138-9</pub-id>
          <pub-id pub-id-type="medline">32607472</pub-id>
          <pub-id pub-id-type="pmcid">PMC7326367</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lundberg</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Nair</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Vavilala</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Horibe</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Eisses</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Adams</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Liston</surname>
              <given-names>DE</given-names>
            </name>
            <name name-style="western">
              <surname>Low</surname>
              <given-names>DKW</given-names>
            </name>
            <name name-style="western">
              <surname>Newman</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Explainable machine-learning predictions for the prevention of hypoxaemia during surgery</article-title>
          <source>Nat Biomed Eng</source>
          <year>2018</year>
          <month>10</month>
          <volume>2</volume>
          <issue>10</issue>
          <fpage>749</fpage>
          <lpage>760</lpage>
          <pub-id pub-id-type="doi">10.1038/s41551-018-0304-0</pub-id>
          <pub-id pub-id-type="medline">31001455</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41551-018-0304-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC6467492</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pinto</surname>
              <given-names>DS</given-names>
            </name>
            <name name-style="western">
              <surname>Grandin</surname>
              <given-names>EW</given-names>
            </name>
          </person-group>
          <article-title>Risk prediction in AMI shock: Goldilocks and the search for "just right"</article-title>
          <source>J Am Coll Cardiol</source>
          <year>2017</year>
          <month>04</month>
          <day>18</day>
          <volume>69</volume>
          <issue>15</issue>
          <fpage>1921</fpage>
          <lpage>1923</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0735-1097(17)30674-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jacc.2017.02.024</pub-id>
          <pub-id pub-id-type="medline">28408021</pub-id>
          <pub-id pub-id-type="pii">S0735-1097(17)30674-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yeh</surname>
              <given-names>RW</given-names>
            </name>
            <name name-style="western">
              <surname>Sidney</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chandra</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sorel</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Selby</surname>
              <given-names>JV</given-names>
            </name>
            <name name-style="western">
              <surname>Go</surname>
              <given-names>AS</given-names>
            </name>
          </person-group>
          <article-title>Population trends in the incidence and outcomes of acute myocardial infarction</article-title>
          <source>N Engl J Med</source>
          <year>2010</year>
          <month>06</month>
          <day>10</day>
          <volume>362</volume>
          <issue>23</issue>
          <fpage>2155</fpage>
          <lpage>2165</lpage>
          <pub-id pub-id-type="doi">10.1056/nejmoa0908610</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shroff</surname>
              <given-names>GR</given-names>
            </name>
            <name name-style="western">
              <surname>Frederick</surname>
              <given-names>PD</given-names>
            </name>
            <name name-style="western">
              <surname>Herzog</surname>
              <given-names>CA</given-names>
            </name>
          </person-group>
          <article-title>Renal failure and acute myocardial infarction: clinical characteristics in patients with advanced chronic kidney disease, on dialysis, and without chronic kidney disease. A collaborative project of the United States Renal Data System/National Institutes of Health and the National Registry of Myocardial Infarction</article-title>
          <source>Am Heart J</source>
          <year>2012</year>
          <month>03</month>
          <volume>163</volume>
          <issue>3</issue>
          <fpage>399</fpage>
          <lpage>406</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/22424010"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ahj.2011.12.002</pub-id>
          <pub-id pub-id-type="medline">22424010</pub-id>
          <pub-id pub-id-type="pii">S0002-8703(11)00883-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC3313453</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>D'Ascenzo</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>De Filippo</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Gallone</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Mittone</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Deriu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Iannaccone</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ariza-Solé</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Liebetrau</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Manzano-Fernández</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Quadri</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Kinnaird</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Campo</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Simao Henriques</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hughes</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dominguez-Rodriguez</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Aldinucci</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Morbiducci</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Patti</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Raposeiras-Roubin</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Abu-Assi</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>De Ferrari</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Piroli</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Saglietto</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Conrotto</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Omedé</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Montefusco</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Pennone</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bruno</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Bocchino</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Boccuzzi</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Cerrato</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Varbella</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Sperti</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wilton</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Velicki</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Xanthopoulou</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Cequier</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Iniguez-Romo</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Munoz Pousa</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Cespon Fernandez</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Caneiro Queija</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Cobas-Paz</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Lopez-Cuenca</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Garay</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Blanco</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Rognoni</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Biondi Zoccai</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Biscaglia</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Nunez-Gil</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Fujii</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Durante</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Song</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Kawaji</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Alexopoulos</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Huczek</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Gonzalez Juanatey</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Nie</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kawashiri</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Colonnelli</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Cantalupo</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Esposito</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Leonardi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Grosso Marra</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Chieffo</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Michelucci</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Piga</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Malavolta</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gili</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Mennuni</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Montalto</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Oltrona Visconti</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Arfat</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Machine learning-based prediction of adverse events following an acute coronary syndrome (PRAISE): a modelling study of pooled datasets</article-title>
          <source>The Lancet</source>
          <year>2021</year>
          <month>01</month>
          <volume>397</volume>
          <issue>10270</issue>
          <fpage>199</fpage>
          <lpage>207</lpage>
          <pub-id pub-id-type="doi">10.1016/S0140-6736(20)32519-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rasmy</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Xiang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Tao</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zhi</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Med-BERT: pretrained contextualized embeddings on large-scale structured electronic health records for disease prediction</article-title>
          <source>NPJ Digit Med</source>
          <year>2021</year>
          <month>05</month>
          <day>20</day>
          <volume>4</volume>
          <issue>1</issue>
          <fpage>86</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41746-021-00455-y"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41746-021-00455-y</pub-id>
          <pub-id pub-id-type="medline">34017034</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41746-021-00455-y</pub-id>
          <pub-id pub-id-type="pmcid">PMC8137882</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
