<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id><journal-id journal-id-type="publisher-id">jmir</journal-id><journal-id journal-id-type="index">1</journal-id><journal-title>Journal of Medical Internet Research</journal-title><abbrev-journal-title>J Med Internet Res</abbrev-journal-title><issn pub-type="epub">1438-8871</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v28i1e77809</article-id><article-id pub-id-type="doi">10.2196/77809</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Detection of Antithrombotic-Related Bleeding in Older Inpatients: Multicenter Retrospective Study Using Structured and Unstructured Electronic Health Record Data</article-title></title-group><contrib-group><contrib contrib-type="author"><name name-style="western"><surname>Coumau</surname><given-names>Claire</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Gaspar</surname><given-names>Frederic</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Zayene</surname><given-names>Mehdi</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Bertrand</surname><given-names>Elliott</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Alberio</surname><given-names>Lorenzo</given-names></name><degrees>Prof Dr Med</degrees><xref ref-type="aff" rid="aff5">5</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Lovis</surname><given-names>Christian</given-names></name><degrees>Prof Dr Med</degrees><xref ref-type="aff" rid="aff6">6</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Beeler</surname><given-names>Patrick E</given-names></name><degrees>PD Dr med</degrees><xref ref-type="aff" rid="aff7">7</xref><xref ref-type="aff" rid="aff8">8</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Rinaldi</surname><given-names>Fabio</given-names></name><degrees>Prof Dr</degrees><xref ref-type="aff" rid="aff9">9</xref><xref ref-type="aff" rid="aff10">10</xref><xref ref-type="aff" rid="aff11">11</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Lutters</surname><given-names>Monika</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff12">12</xref></contrib><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Le Pogam</surname><given-names>Marie-Annick</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff13">13</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" corresp="yes" equal-contrib="yes"><name name-style="western"><surname>Csajka</surname><given-names>Chantal</given-names></name><degrees>Prof Dr</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author"><collab>SwissMADE Collaborators</collab><xref ref-type="aff" rid="aff14">14</xref><xref ref-type="aff" rid="aff17">17</xref></contrib></contrib-group><aff id="aff1"><institution>Center for Research and Innovation in Clinical Pharmaceutical Sciences, Lausanne University Hospital and University of Lausanne</institution><addr-line>Rue du Bugnon 19</addr-line><addr-line>Lausanne</addr-line><country>Switzerland</country></aff><aff id="aff2"><institution>School of Pharmaceutical Sciences, University of Geneva</institution><addr-line>Geneva</addr-line><country>Switzerland</country></aff><aff id="aff3"><institution>Institute of Pharmaceutical Sciences of Western Switzerland, University of Geneva</institution><addr-line>Geneva</addr-line><country>Switzerland</country></aff><aff id="aff4"><institution>Artefact Company</institution><addr-line>Lausanne</addr-line><country>Switzerland</country></aff><aff id="aff5"><institution>Service of Haematology and Central Haematology Laboratory, Lausanne University Hospital and University of Lausanne</institution><addr-line>Lausanne</addr-line><country>Switzerland</country></aff><aff id="aff6"><institution>Division of Medical Information Sciences, Geneva University Hospitals and University of Geneva</institution><addr-line>Geneva</addr-line><country>Switzerland</country></aff><aff id="aff7"><institution>Division of Occupational and Environmental Medicine, Epidemiology, Biostatistics and Prevention Institute, University of Zurich and University Hospital Zurich</institution><addr-line>Zurich</addr-line><country>Switzerland</country></aff><aff id="aff8"><institution>Center for Clinical Research, University of Lucerne</institution><addr-line>Lucerne</addr-line><country>Switzerland</country></aff><aff id="aff9"><institution>Dalle Molle Institute for Artificial Intelligence Research, IDSIA USI-SUPSI</institution><addr-line>Lugano</addr-line><country>Switzerland</country></aff><aff id="aff10"><institution>SIB Swiss Institute of Bioinformatics</institution><addr-line>Lausanne</addr-line><country>Switzerland</country></aff><aff id="aff11"><institution>Faculty of Biology and Medicine, Fondazione Bruno Kessler</institution><addr-line>Trento</addr-line><country>Italy</country></aff><aff id="aff12"><institution>Head of Hospital Pharmacy, Kantonsspital Aarau</institution><addr-line>Aarau</addr-line><country>Switzerland</country></aff><aff id="aff13"><institution>Department of Epidemiology and Health Systems, Unisant&#x00E9;, University Center for Primary Care and Public Health &#x0026; University of Lausanne</institution><addr-line>Lausanne</addr-line><country>Switzerland</country></aff><aff id="aff14"><institution>See Acknowledgments</institution></aff><aff id="aff17">Burnand Bernard, Lang Pierre Olivier, Colic Nicola, Schulthess-Lisibach Angela, Gaudet-Blavignac Christophe, Casati Nathalie, Goldman Jean-Philippe, Foufi Vasiliki</aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Schwartz</surname><given-names>Amy</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Forgerini</surname><given-names>Marcela</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Sazzad</surname><given-names>Sadman</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Modebelu</surname><given-names>Ukamaka</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Chantal Csajka, Prof Dr, Center for Research and Innovation in Clinical Pharmaceutical Sciences, Lausanne University Hospital and University of Lausanne, Rue du Bugnon 19, Lausanne, Switzerland, 1 021 314 42 63; <email>Chantal.Csajka@chuv.ch</email></corresp><fn fn-type="equal" id="equal-contrib1"><label>*</label><p>these authors contributed equally</p></fn></author-notes><pub-date pub-type="collection"><year>2026</year></pub-date><pub-date pub-type="epub"><day>29</day><month>1</month><year>2026</year></pub-date><volume>28</volume><elocation-id>e77809</elocation-id><history><date date-type="received"><day>20</day><month>05</month><year>2025</year></date><date date-type="rev-recd"><day>18</day><month>11</month><year>2025</year></date><date date-type="accepted"><day>27</day><month>11</month><year>2025</year></date></history><copyright-statement>&#x00A9; Claire Coumau, Frederic Gaspar, Mehdi Zayene, Elliott Bertrand, Lorenzo Alberio, Christian Lovis, Patrick E Beeler, Fabio Rinaldi, Monika Lutters, Marie-Annick Le Pogam, Chantal Csajka, SwissMADE Collaborators. Originally published in the Journal of Medical Internet Research (<ext-link ext-link-type="uri" xlink:href="https://www.jmir.org">https://www.jmir.org</ext-link>), 29.1.2026. </copyright-statement><copyright-year>2026</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research (ISSN 1438-8871), is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://www.jmir.org/">https://www.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://www.jmir.org/2026/1/e77809"/><abstract><sec><title>Background</title><p>Bleeding complications are a major contributor to adverse drug events among older inpatients, particularly in those treated with antithrombotic agents. Timely and accurate detection of bleeding events is essential for improving drug safety surveillance and clinical risk management.</p></sec><sec><title>Objective</title><p>The study aimed to develop and validate automated algorithms for detecting major bleeding (MB) and clinically relevant nonmajor bleeding (CRNMB) events from electronic medical records (EMRs) by combining structured data-based rule models and a natural language processing (NLP) approach, and to evaluate their performance and generalizability against a manually reviewed gold standard and an external dataset.</p></sec><sec sec-type="methods"><title>Methods</title><p>We conducted a multicenter retrospective study using routinely collected EMR data from 3 Swiss university hospitals. Patients 65 years or older who received at least one antithrombotic agent and were hospitalized between January 2015 and December 2016 were included. To detect MB and CRNMB events, rule-based algorithms were developed using structured data (<italic>International Statistical Classification of Diseases, 10th Revision, German Modification</italic> [<italic>ICD-10-GM</italic>] codes, laboratory values, transfusion records, and antihemorrhagic prescriptions), with variables and cutoff values defined according to adapted International Society on Thrombosis and Haemostasis definitions and expert consensus. In parallel, a supervised NLP model was applied to discharge summaries from one hospital. A manual review of 754 EMRs served as the reference standard for internal validation, and the algorithm performance of the structured data algorithms (SDA), NLP, and their combination (SDA+NLP) was evaluated against this manually reviewed gold standard using standard performance metrics. External validation was performed on an independent dataset from the Lausanne University Hospital to assess model robustness and generalizability.</p></sec><sec sec-type="results"><title>Results</title><p>Among 36,039 inpatient stays, SDA identified 8.26% (n=2979) as MB and 15.04% (n=5419) as CRNMB cases. <italic>ICD-10-GM</italic> codes alone detected 28.5% (n=849) of MB and 31.48% (n=1706) of CRNMB cases, while laboratory data contributed most to event detection (n=1994, 66.94% for MB and n=3663, 67.60% for CRNMB). Integrating SDA with NLP improved detection, identifying 12.2% (920/7513) of MB and 27.4% (2062/7513) of CRNMB cases at 1 hospital. The combined model achieved the best performance (sensitivity 0.84, positive predictive value 0.51, <italic>F</italic><sub>1</sub>-score 0.64). External validation on Lausanne University Hospital 2021&#x2010;2022 data (n=24,054 stays) confirmed the algorithms&#x2019; reproducibility; the prevalence of MB decreased while CRNMB increased, reflecting evolving clinical practices and antithrombotic use patterns.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>Our integrated approach, combining SDA with NLP, enhances the detection of hemorrhagic events in older hospitalized patients treated with antithrombotic agents, suggesting its potential usefulness for drug safety monitoring and clinical risk management.</p></sec><sec sec-type="registered-report"><title>International Registered Report Identifier (IRRID)</title><p>RR2-10.2196/40456</p></sec></abstract><kwd-group><kwd>adverse drug events</kwd><kwd>adverse drug reactions</kwd><kwd>older inpatients</kwd><kwd>structured data mining</kwd><kwd>machine learning</kwd><kwd>natural language processing</kwd><kwd>electronic medical records</kwd><kwd>multicenter study</kwd><kwd>antithrombotic</kwd><kwd>hemorrhage</kwd><kwd>artificial intelligence</kwd><kwd>pharmacovigilance</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Over 16% of older inpatients experience at least 1 adverse drug event (ADE) during their hospital stay [<xref ref-type="bibr" rid="ref1">1</xref>], often with more severe consequences than in younger patients [<xref ref-type="bibr" rid="ref2">2</xref>]. Among the medications most frequently implicated, antithrombotic agents, widely prescribed in older adults for the prevention and treatment of cardiovascular disease, stand out as a major cause of bleeding-related ADEs [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref3">3</xref>]. Hemorrhagic complications represent a substantial share of drug-related harm in this population and are associated with longer hospital stays, higher readmission rates, and increased mortality. Continuous and accurate measurement of these events is therefore essential to inform prevention strategies, strengthen pharmacovigilance, and promote safer antithrombotic use in clinical practice.</p><p>Various approaches have been developed to detect ADEs in hospital settings, each with advantages and limitations. Spontaneous reporting systems, though simple to implement, notoriously underestimate the true frequency of ADEs due to underreporting [<xref ref-type="bibr" rid="ref4">4</xref>]. Systematic chart reviews of electronic medical records (EMRs), often considered the reference standard, provide detailed clinical information but are too resource- and time-intensive for routine surveillance [<xref ref-type="bibr" rid="ref5">5</xref>]. To overcome these constraints, automated detection methods using routinely collected EMR data have emerged. These approaches leverage both structured data, such as diagnostic codes, medication records, laboratory results, and vital signs, and unstructured clinical narratives, including discharge summaries, progress notes, and consultation reports. Structured data are accessible and standardized, supporting large-scale analyses but may lack contextual nuances needed to capture complex clinical events such as bleeding [<xref ref-type="bibr" rid="ref6">6</xref>-<xref ref-type="bibr" rid="ref8">8</xref>]. Conversely, textual data, although unstructured, often contain richer clinical detail but require advanced computational methods for analysis. Recent advances in machine learning (ML) and natural language processing (NLP) have markedly improved the ability to extract this information and are increasingly applied to pharmacovigilance and ADE detection [<xref ref-type="bibr" rid="ref9">9</xref>]. Integrating both structured and textual data appears particularly promising for identifying bleeding events, potentially enhancing accuracy and completeness [<xref ref-type="bibr" rid="ref10">10</xref>].</p><p>Despite growing interest in automated ADE detection to support drug safety monitoring, important knowledge gaps remain, particularly in the Swiss context. Most existing studies focusing on bleeding events have relied exclusively on either structured or unstructured data [<xref ref-type="bibr" rid="ref11">11</xref>-<xref ref-type="bibr" rid="ref15">15</xref>], have prioritized prediction rather than detection [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref16">16</xref>], or have focused on specific bleeding types or patient groups [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref17">17</xref>-<xref ref-type="bibr" rid="ref19">19</xref>]. Furthermore, clear operational definitions distinguishing major bleeding (MB) from clinically relevant nonmajor bleeding (CRNMB) are often lacking, limiting comparability across studies [<xref ref-type="bibr" rid="ref20">20</xref>]. To date, no study in Switzerland has comprehensively evaluated the combined contribution of structured and textual data for ADE detection in a general inpatient population receiving antithrombotic therapy. To address this gap, we conducted a multicenter study integrating rule-based algorithms and NLP to detect MB and CRNMB events among older inpatients treated with antithrombotics. We hypothesized that combining structured and textual EMR data would improve the accuracy and completeness of bleeding event identification compared with using either data source alone. The study aimed to develop rule-based algorithms for bleeding detection from structured data sources (diagnoses, laboratory results, transfusions, and antihemorrhagic prescriptions) based on international definitions; design and train an NLP model to identify bleeding mentions in discharge summaries; assess and compare the diagnostic performance of structured data algorithms (SDA), NLP, and their combination (SDA+NLP) against a manually reviewed gold standard; and evaluate the generalizability of the best-performing models through external validation on an independent dataset.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Study Design</title><p>We conducted a multicenter cross-sectional study using retrospective data covering the period from January 1, 2015, to December 31, 2016. Data were obtained from 4 large Swiss hospitals: Lausanne University Hospital (CHUV; approximately 1500 beds [<xref ref-type="bibr" rid="ref21">21</xref>]), Geneva University Hospital (HUG; approximately 2000 beds [<xref ref-type="bibr" rid="ref22">22</xref>]), both located in the French-speaking region and serving the cantons of Vaud and Geneva, respectively, Z&#x00FC;rich University Hospital (USZ; approximately 900 beds [<xref ref-type="bibr" rid="ref23">23</xref>]) serving the Zurich metropolitan area, and Baden Cantonal Hospital (KSB; approximately 400 beds [<xref ref-type="bibr" rid="ref24">24</xref>]) serving the canton of Aargau in the German-speaking region. This study was conducted in accordance with the SRTOBE (Strengthening the Reporting of Observational Studies in Epidemiology) statement (<xref ref-type="supplementary-material" rid="app7">Checklist 1</xref>).</p><p>The 2015&#x2010;2016 dataset was used for algorithm development as it was the most recent period with harmonized, high-quality structured and unstructured EMR data across all hospitals. Later years were excluded due to EMR vendor transitions, database restructuring, and new data-governance restrictions limiting access to deidentified text. A more recent CHUV dataset (2021&#x2010;2022) was used for temporal and external validation to test algorithm robustness under evolving clinical practices and documentation standards.</p></sec><sec id="s2-2"><title>Study Participants and Hospital Stays</title><p>Eligible participants were Swiss residents 65 years or older treated with at least 1 antithrombotic agent during their hospital stay. Antithrombotic agents included vitamin K antagonists, heparins, platelet aggregation inhibitors, direct thrombin inhibitors, direct factor Xa inhibitors, or fondaparinux. Hospitalizations had to last at least 24 hours and to occur between January 2015 and December 2016 (test dataset). For the external validation, an additional dataset from CHUV covering January 2021 to December 2022 was used (validation dataset). Only patients who had provided explicit consent for the reuse of their health data for research purposes, as indicated by the signature of the general consent form, were eligible for inclusion. Hospital stays lasting less than 24 hours were excluded from the analysis.</p></sec><sec id="s2-3"><title>Data Sources and Preprocessing</title><p>Each participating hospital extracted relevant clinical data from its institutional data warehouses for all inpatient stays meeting the inclusion criteria. The extracted datasets included both structured and unstructured data. Structured data comprised administrative information, patient movements within the hospital, key clinical and laboratory parameters, and prescribed medications coded using the anatomical therapeutic chemical classification. Diagnostic codes were drawn from the <italic>International Statistical Classification of Diseases, 10th Revision, German Modification</italic> (<italic>ICD-10-GM</italic>), and procedures were coded according to the Swiss Classification of Surgical Procedures (CHOP). Diagnoses and procedures were obtained from the hospital billing records associated with each inpatient stay. Unstructured data included discharge summaries. Further details on data extraction and handling are available in the published study protocol [<xref ref-type="bibr" rid="ref25">25</xref>].</p><p>Prior to analysis, structured data were cleaned, harmonized, and verified for consistency at each site, then locally deidentified before being transferred to a centralized database hosted at CHUV. Unstructured data were deidentified and, where necessary, converted into machine-readable formats, but were stored locally on secure hospital servers to comply with data governance policies. Due to the extent of missing and inconsistent information, such as discrepancies in data structure, coding systems, variable definitions, and extensive missing values, reliable harmonization of KSB data with the other hospitals was not feasible, and data from KSB were excluded from the analysis. In addition, only unstructured data from CHUV were analyzed, as full deidentification of textual data from the other sites could not be ensured. The same preprocessing workflow was applied to the 2021&#x2010;2022 CHUV dataset used for external validation. An overview of the data processing workflow is provided in <xref ref-type="fig" rid="figure1">Figure 1</xref>.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Overview of the data extraction and preprocessing pipeline for structured and unstructured electronic medical record (EMR) data. CHOP: Swiss Classification of Surgical Procedures; CHUV: Lausanne University Hospital; <italic>ICD-10-GM</italic>: <italic>International Statistical Classification of Diseases, 10th Revision, German Modification</italic>.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v28i1e77809_fig01.png"/></fig></sec><sec id="s2-4"><title>Bleeding Detection Algorithms</title><p>We selected variables of interest and cutoff values for our algorithms based on an adaptation of the International Society on Thrombosis and Haemostasis (ISTH) definitions of MB [<xref ref-type="bibr" rid="ref26">26</xref>] and CRNMB [<xref ref-type="bibr" rid="ref27">27</xref>], informed by an extensive review of international guidelines (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). MB was defined as a hemoglobin drop of 4 g/dL or more within 48 hours, a 2 to 4 g/dL drop associated with death within 24 hours, a hemoglobin level less than 7 g/dL, a hemoglobin level between 7 and 9 g/dL associated with death within 24 hours, or a transfusion of more than 5 units of blood or red blood cells. CRNMB was defined as a hemoglobin drop of 2 to 4 g/dL within 48 hours not associated with death or a hemoglobin nadir between 7 and 9 g/dL without subsequent death. The ISTH hemoglobin thresholds were adapted to improve specificity in older inpatients and to reduce the risk of misclassifying nonhemorrhagic anemias. The 5-unit transfusion threshold was pragmatically chosen due to the limited granularity of CHOP procedural codes. Additional structured indicators were also integrated to refine case classification: the prescription of antihemorrhagic agents (idarucizumab, andexanet alfa, prothromplex, octaplex, and beriplex) was considered indicative of MB. MB-related in-hospital mortality was defined as any hospital stay involving at least 1 MB event followed by death during the same admission. We then developed rule-based algorithms using Boolean logic to detect MB and CRNMB cases from structured data (<xref ref-type="fig" rid="figure2">Figure 2</xref>).</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Algorithmic framework for detection of major bleeding (MB) and nonmajor clinically relevant bleeding (CRNMB) cases using structured data. Antihemorrhagic agent: idarucizumab, andexanet alfa, prothromplex, octaplex, and beriplex. &#x2206;Hb: drop in hemoglobin levels within 48 hours; <italic>ICD-10-GM</italic>: <italic>International Statistical Classification of Diseases, 10th Revision, German Modification</italic>; Min Hb: minimum hemoglobin value during the stay.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v28i1e77809_fig02.png"/></fig><p>The <italic>ICD-10-GM</italic> list comprised 12 codes for MB and 41 codes for CRNMB (<xref ref-type="table" rid="table1">Table 1</xref>). We defined an MB in-hospital mortality case as a stay containing an MB occurring during hospitalization followed by death of the patient during the same hospitalization period. We measure the prevalence of bleeding cases, corresponding to inpatient stays with at least 1 MB or CRNMB event, either present on admission or occurring during hospitalization. We quantified the relative and absolute contribution of each structured data source (diagnoses, laboratory, transfusions, and medications), both individually and in combination, in terms of overall detection capacity and proportion of identified bleeding events.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Lists of deficient systems/organs and distribution of <italic>ICD-10-GM</italic><sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup> chapters and codes identifying MB<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup> and CRNMB<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup> cases.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="top">Types of hemorrhagic events</td><td align="left" valign="top"><italic>ICD-10-GM</italic> codes</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="2">MB</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Hyphema</td><td align="left" valign="top">H21.0</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Hemorrhage and rupture of the choroid</td><td align="left" valign="top">H31.3</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Retinal, vitreous, or subarachnoid hemorrhage</td><td align="left" valign="top">H35.6, H43.1, I60_</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Hemopericardium not classified elsewhere</td><td align="left" valign="top">I31.2</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Intracerebral hemorrhage</td><td align="left" valign="top">I61_</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Other nontraumatic intracranial hemorrhages</td><td align="left" valign="top">I62_</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Hemoperitoneum</td><td align="left" valign="top">K66.1</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Hemarthrosis</td><td align="left" valign="top">M25.0_</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Hypovolemic shock</td><td align="left" valign="top">R57.1</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Shock during or after a procedure for diagnostic and therapeutic purposes, not classified elsewhere</td><td align="left" valign="top">T81.1</td></tr><tr><td align="left" valign="top" colspan="2">CRNMB</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Conjunctival hemorrhage</td><td align="left" valign="top">H11.3</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Otorrhagia</td><td align="left" valign="top">H92.2</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Hemorrhagic esophageal varices</td><td align="left" valign="top">I85.0, I98.3</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Other specified diseases of the esophagus</td><td align="left" valign="top">K22.8</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Non-traumatic hemothorax</td><td align="left" valign="top">J94.2</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Gastric, duodenal, or gastrojejunal ulcer with hemorrhage and/or perforation</td><td align="left" valign="top">K25.0, K25.2, K25.6, K26.0, K26.2, K26.4, K26.6, K27.0, K27.2, K27.4, K27.6, K28.0, K28.2, K28.4, K28.6</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Acute hemorrhagic gastritis</td><td align="left" valign="top">K29.0</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Rectal and anal hemorrhage</td><td align="left" valign="top">K62.5</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Hematemesis</td><td align="left" valign="top">K92.0</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Melena</td><td align="left" valign="top">K92.1</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Unspecified gastrointestinal hemorrhage</td><td align="left" valign="top">K92.2</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Prostatic congestion and hemorrhage</td><td align="left" valign="top">N42.1</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Hematoma of the broad ligament</td><td align="left" valign="top">N83.7</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Hematometra</td><td align="left" valign="top">N85.7</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Abnormal bleeding from the uterus and vagina</td><td align="left" valign="top">N93.8, N93.9</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Postmenopausal bleeding</td><td align="left" valign="top">N95.0</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Epistaxis</td><td align="left" valign="top">R04.0</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Throat hemorrhage</td><td align="left" valign="top">R04.1</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Hemoptysis</td><td align="left" valign="top">R04.2</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Respiratory tract hemorrhage</td><td align="left" valign="top">R04.8, R04.9</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Spontaneous ecchymosis</td><td align="left" valign="top">R23.3</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Unspecified hematuria</td><td align="left" valign="top">R31</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Hemorrhage, not classified elsewhere</td><td align="left" valign="top">R58, T81.0</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup><italic>ICD-10-GM</italic>: <italic>International Classification of Diseases, 10th Revision, German Modification</italic>.</p></fn><fn id="table1fn2"><p><sup>b</sup>MB: major bleeding.</p></fn><fn id="table1fn3"><p><sup>c</sup>CRNMB: clinically relevant nonmajor bleeding.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s2-5"><title>Natural Language Processing Model</title><p>To complement structured data detection, we developed a supervised ML model to identify MB, CRNMB, and past bleeding cases documented in discharge summaries.</p><p>A dataset of 400 discharge summaries from CHUV was randomly divided into a training set (n=280) and a test set (n=120), including 100 summaries with MB, 100 with CRNMB, and 200 with no bleeding. Three independent physicians manually annotated the 400 discharge summaries using 4 mutually exclusive labels: (A) &#x2018;presence of CRNMB,&#x2019; (B) &#x2018;presence of MB&#x2019; (as previously defined), (C) &#x2018;history of bleeding&#x2019; (when a discharge summary mentioned bleeding in the EMR before the hospital admission), and (D) &#x2018;absence of any bleeding.&#x2019; Preprocessing steps included tokenization, lemmatization, and sentence segmentation using the French spaCy model (v3.0) [<xref ref-type="bibr" rid="ref28">28</xref>]. The classification pipeline combined logistic regression and support vector machine models, selected for their interpretability and robustness with limited training data. We deliberately used a classical supervised ML model rather than deep learning architectures to ensure interpretability, reproducibility, and computational efficiency, which are essential for clinical validation and routine pharmacovigilance applications. This approach also better suited the relatively small, annotated corpus, allowing transparent feature weighting and easier auditability across institutions. The model was trained using the scikit-learn library (Python v3.9.1). The classification pipeline proceeded in 3 stages: step 1: binary classifier to identify bleeding-relevant versus irrelevant sentences; step 2: multiclass classifier to distinguish between <italic>irrelevant</italic>, <italic>antecedent bleeding</italic>, and <italic>active bleeding</italic>; step 3: binary classifier to further differentiate between MB and CRNMB within sentences flagged as active bleeding. Sentence-level predictions were aggregated to assign a final label to each document. Rules were prioritized as follows: MB&#x003E;CRNMB&#x003E;history of bleeding&#x003E;no bleeding. This ensured a conservative classification hierarchy, favoring the identification of more severe bleeding cases when multiple labels were present. Further methodological details are available in the study proposal previously published [<xref ref-type="bibr" rid="ref25">25</xref>], the related article [<xref ref-type="bibr" rid="ref29">29</xref>], and summarized in <xref ref-type="fig" rid="figure3">Figure 3</xref>.</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Natural language processing workflow from raw text input to final classification output. BERT: Bidirectional Encoder Representations From Transformers; DS: discharge summary; HBDSCAN: Hierarchical Density-Based Spatial Clustering of Applications With Noise; UMAP: Uniform Manifold Approximation and Projection.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v28i1e77809_fig03.png"/></fig></sec><sec id="s2-6"><title>Validation of the Bleeding Detection Algorithms</title><sec id="s2-6-1"><title>Internal Validation Using CHUV 2015-2016 Data</title><p>To validate the SDA and SDA combined with NLP (SDA+NLP) models, we conducted a manual review of 754 EMRs from CHUV&#x2019;s 2015&#x2010;2016 dataset. The sample size for validation was determined using a test result-based sampling method [<xref ref-type="bibr" rid="ref30">30</xref>]. Assuming a 7% MB, a 10% CRNMB accuracy, and a sensitivity of 0.7, at least 704 EMRs had to be reviewed, and 754 EMRs were effectively reviewed. Four physicians independently reviewed the records to compare algorithm-detected with clinician-identified MB and CRNMB cases. The review process followed a structured protocol aligned with ISTH definitions [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref27">27</xref>] and adapted for retrospective application to routinely collected hospital data. Reviewers assessed each inpatient stay according to 4 key criteria: (1) evidence of active bleeding, (2) severity of the event (eg, hemodynamic instability), (3) need for therapeutic intervention (eg, transfusion volume, administration of antihemorrhagic agents), and (4) temporal relationship to hospital admission (present on admission versus occurred during stay). A complete list of synonyms used to identify MB and CRNMB cases during manual chart review is provided in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>. Two binary classification scenarios were evaluated: (1) MB versus all other cases (CRNMB or no bleeding), and (2) CRNMB versus no bleeding (excluding MB). Algorithm performance was evaluated at the inpatient-stay level using standard binary classification metrics (sensitivity, specificity, positive predictive value [PPV], negative predictive value, accuracy, and <italic>F</italic><sub>1</sub>-score), with manual chart review as the gold standard. Comparisons between SDA, NLP, and combined models were descriptive, and sensitivity was prioritized due to the study&#x2019;s patient safety focus. Interrater reliability among reviewers was evaluated using Fleiss &#x03BA; on a subset of 40 cases, with agreement levels interpreted according to Landis and Koch [<xref ref-type="bibr" rid="ref31">31</xref>] (&#x003E;0.80: <italic>almost perfect</italic>; 0.61&#x2010;0.80: <italic>substantial</italic>; 0.41&#x2010;0.60: <italic>moderate</italic>; 0.21&#x2010;0.40: <italic>fair</italic>; 0.00&#x2010;0.20: <italic>slight</italic>; &#x003C;0.00: <italic>poor</italic>). A <italic>P</italic> value associated with the Fleiss &#x03BA; coefficient was also calculated, with a <italic>P</italic> value less than .05 indicating statistically significant agreement. Additional details and results are provided in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>. In a subanalysis, a causal relationship between antithrombotic therapy and each bleeding event was also assessed during the manual review, using a structured tool based on temporal association, biological plausibility, and alternative explanations. Cases were rated as <italic>certain</italic>, <italic>probable</italic>, <italic>possible</italic>, or <italic>unclassified,</italic> in relation to antithrombotic exposure, according to the WHO-Uppsala Monitoring Center scale [<xref ref-type="bibr" rid="ref32">32</xref>]. The methodology, sample size calculation, and findings of the causality assessment of the subanalysis are presented in <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>.</p></sec><sec id="s2-6-2"><title>External Validation Using CHUV 2021-2022 Data</title><p>An external validation was performed using CHUV data from 24,054 inpatient stays between January 2021 and December 2022. We applied the same detection algorithms (SDA and SDA+NLP) to this independent dataset to evaluate their performance, robustness, and reproducibility. Results were compared to those from the 2015&#x2010;2016 CHUV dataset.</p></sec></sec><sec id="s2-7"><title>Statistical Analysis</title><p>Descriptive statistics were used to summarize population characteristics. Comorbidity was assessed using the Charlson and Elixhauser indexes [<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref34">34</xref>], which are validated tools for risk adjustment and mortality prediction based on administrative health data. Comparisons of patient characteristics between hospitals were conducted using a 1-way analysis of variance on ranks (Kruskal-Wallis test) for continuous variables and Pearson &#x03C7;<sup>2</sup> test for categorical variables. Hyperparameters of the NLP classifier were optimized through 5-fold cross-validation on the training set, and final performance was estimated on an independent test set. All performance metrics were reported with 95% CIs calculated using the Wilson method. Analyses were conducted using StataCorp. 2021. Stata Statistical Software: Release 17. College Station, TX: StataCorp LLC software for structured data and Python (v3.9.1) for NLP development.</p></sec><sec id="s2-8"><title>Ethical Considerations</title><sec id="s2-8-1"><title>Human Subject Ethics Review Approvals or Exemptions</title><p>This study was conducted in accordance with the <italic>Declaration of Helsinki</italic> and Swiss federal regulations governing research on human data. Ethical approval was obtained from all relevant cantonal ethics committees, coordinated by the lead committee of the Canton of Vaud (CER-VD No. 2018&#x2010;00272). As the study involved secondary analysis of routinely collected, deidentified hospital data, it qualified for a simplified review under Swiss Human Research Act article 2, paragraph 2(c).</p></sec><sec id="s2-8-2"><title>Informed Consent</title><p>The study relied exclusively on existing clinical data that were deidentified before analysis. According to Swiss regulations and institutional data governance policies, informed consent was waived for patients who had not explicitly objected to the use of their medical data for research purposes. All participating hospitals operate an institutional opt-out procedure, allowing patients to refuse the secondary use of their data for research.</p></sec><sec id="s2-8-3"><title>Privacy and Confidentiality</title><p>All data were deidentified at source before analysis. Structured data were transferred through secure institutional channels to a restricted-access research environment hosted at CHUV. Unstructured textual data remained stored locally on hospital servers and were processed within each institution&#x2019;s secure infrastructure to comply with data protection requirements. No directly identifiable information was accessible to the investigators.</p></sec><sec id="s2-8-4"><title>Compensation Details</title><p>No compensation was provided to patients, as the study involved secondary analysis of preexisting, routinely collected data and did not include direct contact with participants.</p></sec><sec id="s2-8-5"><title>Protection of Identifiable Information in Figures and Supplementary Materials</title><p>No image, document, or figure contains any identifiable patient information. Consequently, no individual consent for image publication was required.</p></sec><sec id="s2-8-6"><title>Ethics Approval</title><p>Approved by the Cantonal Ethics Committee of Vaud, Switzerland (CER-VD No. 2018&#x2010;00272); informed consent was waived for patients who did not opt out of research data use.</p></sec></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Study Population Characteristics</title><p>A total of 36,039 inpatient stays, involving 24,991 unique patients, were included in the analysis: 7677 stays (5754 patients) at CHUV, 18,015 stays (11,356 patients) at HUG, and 10,347 stays (7881 patients) at USZ. Patient characteristics are detailed in <xref ref-type="table" rid="table2">Table 2</xref>. The median age at admission was 78 (IQR 65&#x2010;99) years, with a balanced sex distribution (51.40% male). Comorbidity was generally low across the cohort, with a median Charlson index and Elixhauser index of 0.0; USZ patients had the lowest overall comorbidity burden.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Baseline patient characteristics and treatments: overall and by university hospital.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Characteristics</td><td align="left" valign="bottom">All hospitals (n=36,039)<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup></td><td align="left" valign="bottom">CHUV<sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup> (n=7677)</td><td align="left" valign="bottom">HUG<sup><xref ref-type="table-fn" rid="table2fn3">c</xref></sup> (n=18,015)</td><td align="left" valign="bottom">USZ<sup><xref ref-type="table-fn" rid="table2fn4">d</xref></sup> (n=10,347)</td></tr></thead><tbody><tr><td align="left" valign="top"><named-content content-type="indent">Admission age</named-content> (years), median (IQR)</td><td align="left" valign="top">78 (65&#x2010;99)</td><td align="left" valign="top">79 (65&#x2010;99)</td><td align="left" valign="top">80 (65&#x2010;99)</td><td align="left" valign="top">75 (65&#x2010;92)</td></tr><tr><td align="left" valign="top" colspan="5">Sex, n (%)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Male</td><td align="left" valign="top">18,525 (51.40)</td><td align="left" valign="top">3987 (51.93)</td><td align="left" valign="top">8638 (47.95)</td><td align="left" valign="top">5900 (57.02)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Female</td><td align="left" valign="top">17,514 (48.60)</td><td align="left" valign="top">3690 (48.07)</td><td align="left" valign="top">9377 (52.05)</td><td align="left" valign="top">4447 (42.98)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">Length of stay (d)</named-content>, median (IQR)</td><td align="left" valign="top">9 (1-342)</td><td align="left" valign="top">9 (1-293)</td><td align="left" valign="top">12 (1&#x2010;342)</td><td align="left" valign="top">6 (1-145)</td></tr><tr><td align="left" valign="top">Transfer to intensive care, n (%)</td><td align="left" valign="top">1534 (4.26)</td><td align="left" valign="top">467 (6.1)</td><td align="left" valign="top">1067 (5.92)</td><td align="left" valign="top">&#x2014;<sup><xref ref-type="table-fn" rid="table2fn5">e</xref></sup></td></tr><tr><td align="left" valign="top">In-hospital mortality, n (%)</td><td align="left" valign="top">1416 (3.93)</td><td align="left" valign="top">345 (4.5)</td><td align="left" valign="top">850 (4.7)</td><td align="left" valign="top">221 (2.1)</td></tr><tr><td align="left" valign="top" colspan="5">Comorbidity, n (%)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Chronic renal dysfunction</td><td align="left" valign="top">8418 (23.36)</td><td align="left" valign="top">2163 (28.18)</td><td align="left" valign="top">5662 (31.43)</td><td align="left" valign="top">593 (5.7)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Dialysis</td><td align="left" valign="top">622 (1.7)</td><td align="left" valign="top">176 (2.3)</td><td align="left" valign="top">241 (1.3)</td><td align="left" valign="top">205 (2.0)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Acute renal dysfunction</td><td align="left" valign="top">1151 (3.19)</td><td align="left" valign="top">266 (3.5)</td><td align="left" valign="top">623 (3.5)</td><td align="left" valign="top">262 (2.5)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Chronic liver dysfunction</td><td align="left" valign="top">1020 (2.83)</td><td align="left" valign="top">294 (3.8)</td><td align="left" valign="top">497 (2.8)</td><td align="left" valign="top">229 (2.2)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Acute liver dysfunction</td><td align="left" valign="top">498 (1.4)</td><td align="left" valign="top">145 (1.9)</td><td align="left" valign="top">244 (1.4)</td><td align="left" valign="top">109 (1.1)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Hypertension</td><td align="left" valign="top">18,316 (50.82)</td><td align="left" valign="top">3158 (41.14)</td><td align="left" valign="top">9271 (51.46)</td><td align="left" valign="top">5887 (56.90)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Alcohol abuse</td><td align="left" valign="top">1354 (3.76)</td><td align="left" valign="top">388 (5.1)</td><td align="left" valign="top">663 (3.7)</td><td align="left" valign="top">303 (2.9)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Stroke</td><td align="left" valign="top">3001 (8.33)</td><td align="left" valign="top">813 (10.6)</td><td align="left" valign="top">1625 (9.02)</td><td align="left" valign="top">563 (5.4)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Cancer</td><td align="left" valign="top">6776 (18.80)</td><td align="left" valign="top">1572 (20.48)</td><td align="left" valign="top">2905 (16.13)</td><td align="left" valign="top">2299 (22.22)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Platelet coagulation defect</td><td align="left" valign="top">2178 (6.04)</td><td align="left" valign="top">496 (6.5)</td><td align="left" valign="top">1029 (5.71)</td><td align="left" valign="top">653 (6.3)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Anemia</td><td align="left" valign="top">7624 (21.15)</td><td align="left" valign="top">1998 (26.03)</td><td align="left" valign="top">4380 (24.31)</td><td align="left" valign="top">1246 (12.04)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Risk fall</td><td align="left" valign="top">11,376 (31.57)</td><td align="left" valign="top">2932 (38.20)</td><td align="left" valign="top">6021 (33.42)</td><td align="left" valign="top">2423 (23.42)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Diabetes</td><td align="left" valign="top">6638 (18.42)</td><td align="left" valign="top">1314 (17.12)</td><td align="left" valign="top">3575 (19.84)</td><td align="left" valign="top">1749 (16.90)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Recent myocardial infection</td><td align="left" valign="top">1923 (5.34)</td><td align="left" valign="top">609 (7.9)</td><td align="left" valign="top">761 (4.2)</td><td align="left" valign="top">553 (5.3)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Low weight</td><td align="left" valign="top">4059 (11.26)</td><td align="left" valign="top">967 (12.6)</td><td align="left" valign="top">2533 (14.06)</td><td align="left" valign="top">559 (5.4)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Thrombolysis</td><td align="left" valign="top">695 (1.9)</td><td align="left" valign="top">180 (2.3)</td><td align="left" valign="top">512 (2.8)</td><td align="left" valign="top">3 (0.0)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Vascular malformation</td><td align="left" valign="top">955 (2.6)</td><td align="left" valign="top">153 (2.0)</td><td align="left" valign="top">334 (1.9)</td><td align="left" valign="top">468 (4.5)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">Charlson comorbidity index</named-content>, median (IQR)</td><td align="left" valign="top">0.0 (0.0&#x2010;9.0)</td><td align="left" valign="top">0.0 (0.0&#x2010;9.0)</td><td align="left" valign="top">0.0 (0.0&#x2010;7.0)</td><td align="left" valign="top">0.0 (0.0&#x2010;7.0)</td></tr><tr><td align="left" valign="top">Elixhauser comorbidity index, median (IQR)</td><td align="left" valign="top">0.0 (0.0&#x2010;6.0)</td><td align="left" valign="top">0.0 (0.0&#x2010;6.0)</td><td align="left" valign="top">0.0 (0.0&#x2010;6.0)</td><td align="left" valign="top">0.0 (0.0&#x2010;5.0)</td></tr><tr><td align="left" valign="top" colspan="5">Antithrombotic categories, n (%)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Direct factor Xa inhibitors</td><td align="left" valign="top">3297 (9.15)</td><td align="left" valign="top">599 (7.8)</td><td align="left" valign="top">1478 (8.20)</td><td align="left" valign="top">1220 (11.80)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Vitamin K antagonists</td><td align="left" valign="top">7469 (20.72)</td><td align="left" valign="top">1324 (17.25)</td><td align="left" valign="top">4943 (27.44)</td><td align="left" valign="top">1202 (11.62)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Heparin group</td><td align="left" valign="top">24,784 (6877)</td><td align="left" valign="top">5045 (65.71)</td><td align="left" valign="top">11,918 (66.17)</td><td align="left" valign="top">7821 (75.59)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Direct thrombin inhibitors</td><td align="left" valign="top">255 (0.7)</td><td align="left" valign="top">87 (1.1)</td><td align="left" valign="top">134 (0.7)</td><td align="left" valign="top">34 (0.3)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Platelet aggregation inhibitors</td><td align="left" valign="top">14,220 (39.46)</td><td align="left" valign="top">4354 (56.71)</td><td align="left" valign="top">4700 (26.09)</td><td align="left" valign="top">5166 (49.93)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Thrombolytics</td><td align="left" valign="top">104 (0.3)</td><td align="left" valign="top">15 (0.2)</td><td align="left" valign="top">89 (0.5)</td><td align="left" valign="top">0.0 (0.0)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Other antithrombotic agents: fondaparinux</td><td align="left" valign="top">1365 (3.79)</td><td align="left" valign="top">212 (2.8)</td><td align="left" valign="top">1140 (6.33)</td><td align="left" valign="top">13 (0.1)</td></tr><tr><td align="left" valign="top">Antidotes, n (%)</td><td align="left" valign="top">137 (0.4)</td><td align="left" valign="top">15 (0.2)</td><td align="left" valign="top">122 (0.7)</td><td align="left" valign="top">0.0 (0.0)</td></tr><tr><td align="left" valign="top">Transfusion, n (%)</td><td align="left" valign="top">582 (1.6)</td><td align="left" valign="top">264 (3.4)</td><td align="left" valign="top">318 (1.8)</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x2264;5 UI<sup><xref ref-type="table-fn" rid="table2fn6">f</xref></sup> plasma or red blood cells</td><td align="left" valign="top">225 (0.6)</td><td align="left" valign="top">100 (1.3)</td><td align="left" valign="top">125 (0.7)</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x003E;5 UI plasma or red blood cells</td><td align="left" valign="top">357 (1.0)</td><td align="left" valign="top">164 (2.1)</td><td align="left" valign="top">193 (1.1)</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top" colspan="5">Number of antithrombotic agents received during hospitalization, n (%)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>1</td><td align="left" valign="top">22,397 (62.15)</td><td align="left" valign="top">4257 (55.45)</td><td align="left" valign="top">12,381 (68.73)</td><td align="left" valign="top">5759 (55.66)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>2</td><td align="left" valign="top">11,918 (33.07)</td><td align="left" valign="top">2904 (37.83)</td><td align="left" valign="top">4924 (27.33)</td><td align="left" valign="top">4090 (39.53)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>3</td><td align="left" valign="top">1641 (4.55)</td><td align="left" valign="top">495 (6.4)</td><td align="left" valign="top">669 (3.7)</td><td align="left" valign="top">477 (4.6)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x2265;4</td><td align="left" valign="top">83 (0.2)</td><td align="left" valign="top">21 (0.3)</td><td align="left" valign="top">41 (0.2)</td><td align="left" valign="top">21 (0.2)</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>n: total number of recorded measurements for the respective parameter. </p></fn><fn id="table2fn2"><p><sup>b</sup>CHUV: Lausanne University Hospital.</p></fn><fn id="table2fn3"><p><sup>c</sup>HUG: Geneva University Hospital. </p></fn><fn id="table2fn4"><p><sup>d</sup>USZ: Z&#x00FC;rich University Hospital. </p></fn><fn id="table2fn5"><p><sup>e</sup>Not available (missing or nontransferred data).</p></fn><fn id="table2fn6"><p><sup>f</sup>UI: unit of blood component. </p></fn></table-wrap-foot></table-wrap><p>Distinct prescribing patterns were observed across hospitals: HUG had the highest use of vitamin K antagonists (n=4943, 27.44%), CHUV had the highest prescription rate of antiplatelet agents (n=4354, 56.71%), and USZ reported the highest use of direct factor Xa inhibitors (n=1220, 11.79%) and heparins (n=7821, 75.59%). Hypertension (n=18,316, 50.82%), chronic renal dysfunction (n=8418, 23.36%), anemia (n=7624, 21.15%), and cancer (n=6776, 18.80%) were among the most prevalent comorbidities. Overall, in-hospital mortality was 3.93% (n=1416).</p></sec><sec id="s3-2"><title>Bleeding Detection Using SDA</title><p>SDA detected 8748 (24.27%) overall bleeding cases, of which 2979 (8.26%) were MB cases and 5419 (15.04%) were CRNMB cases (<xref ref-type="table" rid="table3">Table 3</xref>). Fatal MB occurred in 1.0% (n=350) of all stays. MB prevalence varied across hospitals, with the highest proportion observed at CHUV (n=769, 10.0%), followed by USZ (n=998, 9.6%) and HUG (n=1212, 6.73%). CRNMB prevalence was highest at USZ (n=1682, 16.26%). Missing values for each variable used to identify MB and CRNMB events are presented in <xref ref-type="supplementary-material" rid="app5">Multimedia Appendix 5</xref>.</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Prevalence of bleeding cases detected by SDA<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup>, overall and by university hospital<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup>.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom"/><td align="left" valign="bottom">All hospitals, n (%)</td><td align="left" valign="bottom">CHUV<sup><xref ref-type="table-fn" rid="table3fn3">c</xref></sup>, n (%)</td><td align="left" valign="bottom">HUG<sup><xref ref-type="table-fn" rid="table3fn4">d</xref></sup>, n (%)</td><td align="left" valign="bottom">USZ<sup><xref ref-type="table-fn" rid="table3fn5">e</xref></sup>, n (%)</td><td align="left" valign="bottom"><italic>P</italic> value<sup><xref ref-type="table-fn" rid="table3fn6">f</xref></sup></td></tr></thead><tbody><tr><td align="left" valign="top">Nonbleeding-related</td><td align="left" valign="top">27,641 (76.70)</td><td align="left" valign="top">5822 (75.84)</td><td align="left" valign="top">14,152 (78.56)</td><td align="left" valign="top">7667 (74.10)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">CRNMB<sup><xref ref-type="table-fn" rid="table3fn7">g</xref></sup></td><td align="left" valign="top">5419 (15.04)</td><td align="left" valign="top">1086 (14.15)</td><td align="left" valign="top">2651 (14.72)</td><td align="left" valign="top">1682 (16.26)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">MB<sup><xref ref-type="table-fn" rid="table3fn8">h</xref></sup></td><td align="left" valign="top">2979 (8.26)</td><td align="left" valign="top">769 (10.0)</td><td align="left" valign="top">1212 (6.73)</td><td align="left" valign="top">998 (9.6)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">MB in-hospital mortality</td><td align="left" valign="top">350 (1.0)</td><td align="left" valign="top">119 (1.6)</td><td align="left" valign="top">137 (0.8)</td><td align="left" valign="top">94 (0.9)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Total</td><td align="left" valign="top">36,039</td><td align="left" valign="top">7677</td><td align="left" valign="top">18,015</td><td align="left" valign="top">10,347</td><td align="left" valign="top">&#x2014;<sup><xref ref-type="table-fn" rid="table3fn9">i</xref></sup></td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup>SDA: structured data algorithms (ie, rule-based algorithm for structured data).</p></fn><fn id="table3fn2"><p><sup>b</sup>Bleeding cases: number of stays for patients treated with at least 1 antithrombotic agent during which at least 1 bleeding episode occurred.</p></fn><fn id="table3fn3"><p><sup>c</sup>CHUV: Lausanne University Hospital.</p></fn><fn id="table3fn4"><p><sup>d</sup>HUG: Geneva University Hospital.</p></fn><fn id="table3fn5"><p><sup>e</sup>USZ: Z&#x00FC;rich University Hospital.</p></fn><fn id="table3fn6"><p><sup>f</sup>Using Pearson <italic>&#x03C7;</italic><sup>2</sup> test.</p></fn><fn id="table3fn7"><p><sup>g</sup>CRNMB: clinically relevant nonmajor bleeding.</p></fn><fn id="table3fn8"><p><sup>h</sup>MB: major bleeding.</p></fn><fn id="table3fn9"><p><sup>i</sup>Not applicable.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-3"><title>Relative and Absolute Contribution of Structured Data Sources</title><p>Laboratory data were the most influential source for detecting both MB and CRNMB, contributing to two-thirds of identified cases, while <italic>ICD-10-GM</italic> codes contributed to approximately one-third. Prescriptions for antihemorrhagic agents had a minimal added value for MB detection, while transfusion data contributed modestly. <xref ref-type="fig" rid="figure4">Figure 4</xref> illustrates the relative contribution of each data source.</p><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>Relative contribution of structured data sources (laboratory data, <italic>ICD-10-GM</italic> codes, prescription of antihemorrhagic agents, and transfusions) to the detection of major bleeding (MB) and clinically relevant nonmajor bleeding (CRNMB). <italic>ICD-10-GM</italic>: <italic>International Statistical Classification of Diseases, 10th Revision, German Modification</italic>.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v28i1e77809_fig04.png"/></fig><p>Overlap between data sources was limited. Only 12.1% (n=361) of MB stays and 8.7% (n=458) of CRNMB stays were identified by 2 data sources, while detection by all 4 sources occurred in 0% of MB cases and only 0% (n=12) of CRNMB cases (<xref ref-type="fig" rid="figure5">Figure 5</xref>). This limited overlap highlights the complementarity, but also fragmentation, of structured data signals.</p><fig position="float" id="figure5"><label>Figure 5.</label><caption><p>Absolute contribution of structured data sources (laboratory data, <italic>ICD-10-GM</italic> codes, prescription of antihemorrhagic agents, and transfusions) to the detection of (A) major bleeding and (B) clinically relevant nonmajor bleeding. <italic>ICD-10-GM: International Statistical Classification of Diseases, 10th Revision, German Modification</italic>.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v28i1e77809_fig05.png"/></fig></sec><sec id="s3-4"><title>Combined Detection Using SDA and NLP (CHUV Only)</title><p>Among 7513 CHUV stays with discharge summaries, combining SDA and NLP increased case detection: In total, 39.69% (n=2982) of hemorrhagic cases were detected: 12.2% (n=920) were identified as MB and 27.45% (n=2062) as CRNMB.</p><p>For MB cases, 56.6% (n=521) were detected by SDA alone, 19.8% (n=182) by NLP alone, and 23.6% (n=217) by both. For CRNMB cases, 35.1% (n=724) were detected by SDA alone, 48.2% (n=994) by NLP alone, and 16.7% (n=344) by both.</p><p>Classification discrepancies were observed between SDA and NLP: 217 cases identified as MB by SDA were reclassified as CRNMB by NLP, and conversely, 81 CRNMB cases by SDA were reclassified as MB by NLP. NLP also enabled the detection of a history of bleeding in 8.5% (n=642) of cases, improving the temporal resolution of hemorrhage onset.</p></sec><sec id="s3-5"><title>Internal Validation Using CHUV 2015-2016 Data</title><p>The manual review of 754 EMRs identified 276 bleeding cases: 144 MB and 132 CRNMB. Structured laboratory data showed the highest sensitivity (0.58, 95% CI 0.52&#x2010;0.64), while <italic>ICD-10-GM</italic> codes had the highest PPV (0.89, 95% CI 0.83&#x2010;0.98), and <italic>F</italic><sub>1</sub>-score (0.60). SDA outperformed NLP in sensitivity (0.77 vs 0.61), but NLP had higher PPV (0.70 vs 0.51) and <italic>F</italic><sub>1</sub>-score (0.65 vs 0.62). The best performance was achieved by the combined <italic>ICD-10-GM</italic>&#x222A;NLP algorithm, with a sensitivity of 0.71 (95% CI 0.66&#x2010;0.76), PPV of 0.72 (95% CI 0.66&#x2010;0.87), and <italic>F</italic><sub>1</sub>-score of 0.72. Algorithms combining SDA and NLP yielded the highest sensitivity (0.84), confirming the benefit of multimodal approaches. However, intersection-based algorithms (eg, SDA&#x2229;NLP) demonstrated higher specificity at the cost of reduced sensitivity.</p><p>Performance metrics for MB and CRNMB subgroups followed similar trends, with reduced sensitivity but high specificity for <italic>ICD-10-GM</italic>&#x2013;based detection. <xref ref-type="table" rid="table4">Table 4</xref> presents a comprehensive summary of all performance metrics, including sensitivity, specificity, PPV, negative predictive value, accuracy, and <italic>F</italic><sub>1</sub>-score.</p><table-wrap id="t4" position="float"><label>Table 4.</label><caption><p>Performance metrics of bleeding detection algorithms compared to manual electronic medical records review (gold standard; n=754)<sup><xref ref-type="table-fn" rid="table4fn1">a</xref></sup>.</p></caption><table id="table4" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom"/><td align="left" valign="bottom">Sensitivity<sup><xref ref-type="table-fn" rid="table4fn2">b</xref></sup> (95% CI)</td><td align="left" valign="bottom">Specificity<sup><xref ref-type="table-fn" rid="table4fn3">c</xref></sup> (95% CI)</td><td align="left" valign="bottom">PPV<sup><xref ref-type="table-fn" rid="table4fn4">d</xref></sup> (95% CI)</td><td align="left" valign="bottom">NPV<sup><xref ref-type="table-fn" rid="table4fn5">e</xref></sup> (95% CI)</td><td align="left" valign="bottom">Accuracy<sup><xref ref-type="table-fn" rid="table4fn6">f</xref></sup> (95% CI)</td><td align="left" valign="bottom"><italic>F</italic><sub>1</sub>-score<sup><xref ref-type="table-fn" rid="table4fn7">g</xref></sup></td></tr></thead><tbody><tr><td align="left" valign="top" colspan="7">Bleeding all type (MB<sup><xref ref-type="table-fn" rid="table4fn8">h</xref></sup> or CRNMB<sup><xref ref-type="table-fn" rid="table4fn9">i</xref></sup>)</td></tr><tr><td align="left" valign="top" colspan="7"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Individual structured data sources</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><italic>ICD-10-GM</italic><sup><xref ref-type="table-fn" rid="table4fn10">j</xref></sup></td><td align="left" valign="top">0.46 (0.40&#x2010;0.51)</td><td align="left" valign="top">0.97 (0.95&#x2010;0.98)</td><td align="left" valign="top">0.89 (0.83&#x2010;0.98)</td><td align="left" valign="top">0.75 (0.72&#x2010;0.79)</td><td align="left" valign="top">0.78 (0.75&#x2010;0.81)</td><td align="left" valign="top">0.60</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Laboratory data</td><td align="left" valign="top">0.58 (0.52&#x2010;0.64)</td><td align="left" valign="top">0.60 (0.55&#x2010;0.64)</td><td align="left" valign="top">0.45 (0.40&#x2010;0.64)</td><td align="left" valign="top">0.71 (0.66&#x2010;0.75)</td><td align="left" valign="top">0.59 (0.55&#x2010;0.62)</td><td align="left" valign="top">0.51</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Whole blood or red blood cells transfusion</td><td align="left" valign="top">0.18 (0.14&#x2010;0.23)</td><td align="left" valign="top">0.95 (0.93&#x2010;0.97)</td><td align="left" valign="top">0.68 (0.57&#x2010;0.97)</td><td align="left" valign="top">0.67 (0.63&#x2010;0.70)</td><td align="left" valign="top">0.67 (0.63&#x2010;0.70)</td><td align="left" valign="top">0.29</td></tr><tr><td align="left" valign="top" colspan="7"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Detection algorithms</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>SDA<sup><xref ref-type="table-fn" rid="table4fn11">k</xref></sup></td><td align="left" valign="top">0.77 (0.72&#x2010;0.82)</td><td align="left" valign="top">0.58 (0.54&#x2010;0.62)</td><td align="left" valign="top">0.51 (0.47&#x2010;0.62)</td><td align="left" valign="top">0.81 (0.77&#x2010;0.85)</td><td align="left" valign="top">0.65 (0.62&#x2010;0.68)</td><td align="left" valign="top">0.62</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>NLP<sup><xref ref-type="table-fn" rid="table4fn12">l</xref></sup></td><td align="left" valign="top">0.61 (0.55&#x2010;0.67)</td><td align="left" valign="top">0.85 (0.81&#x2010;0.88)</td><td align="left" valign="top">0.70 (0.64&#x2010;0.88)</td><td align="left" valign="top">0.79 (0.75&#x2010;0.82)</td><td align="left" valign="top">0.76 (0.73&#x2010;0.79)</td><td align="left" valign="top">0.65</td></tr><tr><td align="left" valign="top" colspan="7"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Combined data sources and algorithms</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>SDA&#x222A;NLP</td><td align="left" valign="top">0.84 (0.79&#x2010;0.88)</td><td align="left" valign="top">0.54 (0.49&#x2010;0.58)</td><td align="left" valign="top">0.51 (0.47&#x2010;0.58)</td><td align="left" valign="top">0.85 (0.81&#x2010;0.89)</td><td align="left" valign="top">0.65 (0.61&#x2010;0.68)</td><td align="left" valign="top">0.64</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>SDA&#x2229;NLP</td><td align="left" valign="top">0.47 (0.41&#x2010;0.53)</td><td align="left" valign="top">0.92 (0.89&#x2010;0.94)</td><td align="left" valign="top">0.78 (0.71&#x2010;0.94)</td><td align="left" valign="top">0.75 (0.71&#x2010;0.78)</td><td align="left" valign="top">0.76 (0.72&#x2010;0.79)</td><td align="left" valign="top">0.59</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><italic>ICD-10-GM</italic>&#x222A;NLP</td><td align="left" valign="top">0.71 (0.66&#x2010;0.76)</td><td align="left" valign="top">0.84 (0.80&#x2010;0.87)</td><td align="left" valign="top">0.72 (0.66&#x2010;0.87)</td><td align="left" valign="top">0.83 (0.80&#x2010;0.86)</td><td align="left" valign="top">0.79 (0.76&#x2010;0.82)</td><td align="left" valign="top">0.72</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><italic>ICD-10-GM</italic>&#x2229;NLP</td><td align="left" valign="top">0.31 (0.26&#x2010;0.37)</td><td align="left" valign="top">0.99 (0.98&#x2010;1.00)</td><td align="left" valign="top">0.95 (0.89&#x2010;1.00)</td><td align="left" valign="top">0.71 (0.68&#x2010;0.74)</td><td align="left" valign="top">0.74 (0.71&#x2010;0.77)</td><td align="left" valign="top">0.47</td></tr><tr><td align="left" valign="top" colspan="7">MB</td></tr><tr><td align="left" valign="top" colspan="7"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Individual structured data sources</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><italic>ICD-10-GM</italic></td><td align="left" valign="top">0.34 (0.27&#x2010;0.42)</td><td align="left" valign="top">0.99 (0.97&#x2010;0.99)</td><td align="left" valign="top">0.84 (0.73&#x2010;0.99)</td><td align="left" valign="top">0.86 (0.84&#x2010;0.89)</td><td align="left" valign="top">0.86 (0.84&#x2010;0.88)</td><td align="left" valign="top">0.49</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Laboratory data</td><td align="left" valign="top">0.47 (0.39&#x2010;0.55)</td><td align="left" valign="top">0.81 (0.77&#x2010;0.84)</td><td align="left" valign="top">0.36 (0.30&#x2010;0.84)</td><td align="left" valign="top">0.86 (0.83&#x2010;0.89)</td><td align="left" valign="top">0.74 (0.71&#x2010;0.77)</td><td align="left" valign="top">0.41</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Whole blood or red blood cells transfusion</td><td align="left" valign="top">0.22 (0.16&#x2010;0.29)</td><td align="left" valign="top">0.97 (0.96&#x2010;0.98)</td><td align="left" valign="top">0.66 (0.52&#x2010;0.98)</td><td align="left" valign="top">0.84 (0.81&#x2010;0.87)</td><td align="left" valign="top">0.83 (0.80&#x2010;0.85)</td><td align="left" valign="top">0.32</td></tr><tr><td align="left" valign="top" colspan="7"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Algorithms</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>SDA</td><td align="left" valign="top">0.72 (0.64&#x2010;0.78)</td><td align="left" valign="top">0.79 (0.76&#x2010;0.82)</td><td align="left" valign="top">0.45 (0.39&#x2010;0.82)</td><td align="left" valign="top">0.92 (0.90&#x2010;0.94)</td><td align="left" valign="top">0.78 (0.75&#x2010;0.81)</td><td align="left" valign="top">0.55</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>NLP</td><td align="left" valign="top">0.35 (0.28&#x2010;0.44)</td><td align="left" valign="top">0.95 (0.93&#x2010;0.96)</td><td align="left" valign="top">0.63 (0.51&#x2010;0.96)</td><td align="left" valign="top">0.86 (0.83&#x2010;0.89)</td><td align="left" valign="top">0.84 (0.81&#x2010;0.86)</td><td align="left" valign="top">0.45</td></tr><tr><td align="left" valign="top" colspan="7"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Combined data sources and algorithms</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>SDA&#x222A;NLP</td><td align="left" valign="top">0.76 (0.68&#x2010;0.82)</td><td align="left" valign="top">0.79 (0.75&#x2010;0.81)</td><td align="left" valign="top">0.46 (0.39&#x2010;0.82)</td><td align="left" valign="top">0.93 (0.91&#x2010;0.95)</td><td align="left" valign="top">0.78 (0.75&#x2010;0.81)</td><td align="left" valign="top">0.57</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>SDA&#x2229;NLP</td><td align="left" valign="top">0.30 (0.23&#x2010;0.39)</td><td align="left" valign="top">0.96 (0.94&#x2010;0.97)</td><td align="left" valign="top">0.64 (0.52&#x2010;0.97)</td><td align="left" valign="top">0.85 (0.83&#x2010;0.88)</td><td align="left" valign="top">0.83 (0.81&#x2010;0.86)</td><td align="left" valign="top">0.41</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><italic>ICD-10-GM</italic>&#x222A;NLP</td><td align="left" valign="top">0.56 (0.48&#x2010;0.64)</td><td align="left" valign="top">0.94 (0.92&#x2010;0.96)</td><td align="left" valign="top">0.69 (0.60&#x2010;0.96)</td><td align="left" valign="top">0.90 (0.87&#x2010;0.92)</td><td align="left" valign="top">0.87 (0.84&#x2010;0.89)</td><td align="left" valign="top">0.62</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><italic>ICD-10-GM</italic>&#x2229;NLP</td><td align="left" valign="top">0.14 (0.09&#x2010;0.21)</td><td align="left" valign="top">1.0 (0.99&#x2010;1.00)</td><td align="left" valign="top">0.91 (0.72&#x2010;1.00)</td><td align="left" valign="top">0.83 (0.80&#x2010;0.86)</td><td align="left" valign="top">0.83 (0.80&#x2010;0.86)</td><td align="left" valign="top">0.25</td></tr><tr><td align="left" valign="top" colspan="7">CRNMB</td></tr><tr><td align="left" valign="top" colspan="7"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Individual structured data sources</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><italic>ICD-10-GM</italic></td><td align="left" valign="top">0.30 (0.23&#x2010;0.39)</td><td align="left" valign="top">0.91 (0.88&#x2010;0.93)</td><td align="left" valign="top">0.41 (0.32&#x2010;0.93)</td><td align="left" valign="top">0.86 (0.83&#x2010;0.88)</td><td align="left" valign="top">0.80 (0.77&#x2010;0.83)</td><td align="left" valign="top">0.35</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Laboratory data</td><td align="left" valign="top">0.25 (0.18&#x2010;0.33)</td><td align="left" valign="top">0.73 (0.70&#x2010;0.77)</td><td align="left" valign="top">0.17 (0.12&#x2010;0.77)</td><td align="left" valign="top">0.82 (0.79&#x2010;0.85)</td><td align="left" valign="top">0.65 (0.61&#x2010;0.68)</td><td align="left" valign="top">0.20</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Whole blood or red blood cells transfusion</td><td align="left" valign="top">0.03 (0.01&#x2010;0.07)</td><td align="left" valign="top">0.96 (0.95&#x2010;0.98)</td><td align="left" valign="top">0.15 (0.06&#x2010;0.98)</td><td align="left" valign="top">0.82 (0.79&#x2010;0.85)</td><td align="left" valign="top">0.80 (0.77&#x2010;0.83)</td><td align="left" valign="top">0.05</td></tr><tr><td align="left" valign="top" colspan="7"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Detection algorithms</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>SDA</td><td align="left" valign="top">0.65 (0.42&#x2010;0.58)</td><td align="left" valign="top">0.65 (0.62&#x2010;0.69)</td><td align="left" valign="top">0.23 (0.19&#x2010;0.69)</td><td align="left" valign="top">0.86 (0.82&#x2010;0.89)</td><td align="left" valign="top">0.63 (0.59&#x2010;0.66)</td><td align="left" valign="top">0.32</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>NLP</td><td align="left" valign="top">0.53 (0.45&#x2010;0.62)</td><td align="left" valign="top">0.77 (0.74&#x2010;0.81)</td><td align="left" valign="top">0.34 (0.28&#x2010;0.81)</td><td align="left" valign="top">0.89 (0.86&#x2010;0.91)</td><td align="left" valign="top">0.73 (0.70&#x2010;0.76)</td><td align="left" valign="top">0.41</td></tr><tr><td align="left" valign="top" colspan="7"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Combined data sources and algorithms</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>SDA&#x222A;NLP</td><td align="left" valign="top">0.66 (0.57&#x2010;0.73)</td><td align="left" valign="top">0.56 (0.52&#x2010;0.60)</td><td align="left" valign="top">0.24 (0.20&#x2010;0.60)</td><td align="left" valign="top">0.88 (0.85&#x2010;0.91)</td><td align="left" valign="top">0.58 (0.54&#x2010;0.61)</td><td align="left" valign="top">0.35</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>SDA&#x2229;NLP</td><td align="left" valign="top">0.38 (0.30&#x2010;0.47)</td><td align="left" valign="top">0.88 (0.84&#x2010;0.90)</td><td align="left" valign="top">0.40 (0.32&#x2010;0.90)</td><td align="left" valign="top">0.87 (0.84&#x2010;0.89)</td><td align="left" valign="top">0.79 (0.76&#x2010;0.82)</td><td align="left" valign="top">0.39</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><italic>ICD-10-GM</italic>&#x222A;NLP</td><td align="left" valign="top">0.60 (0.52&#x2010;0.68)</td><td align="left" valign="top">0.75 (0.72&#x2010;0.79)</td><td align="left" valign="top">0.35 (0.29&#x2010;0.79)</td><td align="left" valign="top">0.90 (0.87&#x2010;0.92)</td><td align="left" valign="top">0.73 (0.69&#x2010;0.76)</td><td align="left" valign="top">0.44</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content><italic>ICD-10-GM</italic>&#x2229;NLP</td><td align="left" valign="top">0.24 (0.17&#x2010;0.32)</td><td align="left" valign="top">0.93 (0.91&#x2010;0.95)</td><td align="left" valign="top">0.42 (0.31&#x2010;0.95)</td><td align="left" valign="top">0.85 (0.82&#x2010;0.87)</td><td align="left" valign="top">0.81 (0.78&#x2010;0.83)</td><td align="left" valign="top">0.30</td></tr></tbody></table><table-wrap-foot><fn id="table4fn1"><p><sup>a</sup>It should be noted that no patient record contained the variable antihemorrhagic agent for the detection of MB. Consequently, the performance for this variable was not included in the table.</p></fn><fn id="table4fn2"><p><sup>b</sup>Sensitivity: proportion of bleeding cases that have been correctly identified.</p></fn><fn id="table4fn3"><p><sup>c</sup>Specificity: proportion of nonbleeding-related cases that have been correctly identified.</p></fn><fn id="table4fn4"><p><sup>d</sup>PPV: positive predictive value; proportion of bleeding cases among all those classified as bleeding cases by the algorithm.</p></fn><fn id="table4fn5"><p><sup>e</sup>NPV: negative predictive value; proportion of nonbleeding-related cases among all those classified as nonbleeding-related cases by the algorithm.</p></fn><fn id="table4fn6"><p><sup>f</sup>Accuracy: overall prediction accuracy (ie, the proportion of bleeding and nonbleeding-related cases that the algorithm has correctly identified.</p></fn><fn id="table4fn7"><p><sup>g</sup><italic>F</italic><sub>1</sub>-score: harmonic mean of the precision and recall (ie, <italic>F</italic><sub>1</sub>-score = 2 &#x00D7; [recall &#x00D7; precision]/[recall + precision]).</p></fn><fn id="table4fn8"><p><sup>h</sup>MB: major bleeding.</p></fn><fn id="table4fn9"><p><sup>i</sup>CRNMB: clinically relevant nonmajor bleeding.</p></fn><fn id="table4fn10"><p><sup>j</sup><italic>ICD-10-GM</italic>: <italic>International Statistical Classification of Diseases, 10th Revision, German Modification</italic>. </p></fn><fn id="table4fn11"><p><sup>k</sup>SDA: structured data algorithm.</p></fn><fn id="table4fn12"><p><sup>l</sup>NLP: natural language processing.</p></fn></table-wrap-foot></table-wrap><p>Interrater reliability for manual review of 40 EMRs showed substantial agreement: Fleiss&#x2019; Kappa was 0.65 for bleeding detection and 0.61 for MB versus CRNMB classification. Of 276 manually reviewed inpatient stays with bleeding events, 17% (n=48) were attributed to antithrombotic agents. The causal relationship was classified as &#x201C;certain&#x201D; in 25% of cases (n=12), &#x201C;probable/likely&#x201D; in 23% (n=11), and &#x201C;possible&#x201D; in 52% (n=25).</p></sec><sec id="s3-6"><title>External Validation Using CHUV 2021-2022 Data</title><p>Application of the SDA and SDA+NLP algorithms to the CHUV validation dataset (24054 stays) demonstrated generalizability. The prevalence of MB cases significantly decreased from 10.0% in the 2015&#x2010;2016 period to 5.55% (n=1336) in the 2021&#x2010;2022 period, while the prevalence of CRNMB cases increased significantly from 14.15% to 16.63% (n=4000). MB in-hospital mortality also rose, from 1.6% to 2.6% (n=616).</p><p>Patient characteristics differed significantly between cohorts (<xref ref-type="supplementary-material" rid="app6">Multimedia Appendix 6</xref>). Direct oral anticoagulant prescriptions increased from 7.8% to 22.7%, while vitamin K antagonist use decreased from 17.2% to 7.6%. The incidence of elevated INR values &#x003E;4 declined from 3.3% to 1.8%. Both Charlson and Elixhauser scores increased, reflecting higher comorbidity. Transfusions involving &#x2264;5 units of blood rose from 1.3% to 8.8%. Notably, the proportion of patients receiving &#x2265;3 antithrombotic agents during hospitalization increased fivefold (from 6.7% to 35.0%).</p></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>To our knowledge, this is one of the first multicenter studies assessing the feasibility and effectiveness of combining structured and unstructured EMR data to detect bleeding cases in older inpatients treated by one or more antithrombotic agents. Across 3 large university hospitals, our SDA identified 8.26% of MB and 15.4% of CRNMB cases. Laboratory variables contributed most to event detection, while <italic>ICD-10-GM</italic> codes alone captured only about one-third of cases, achieving a sensitivity of 0.84 when both data sources were combined. These findings confirm the feasibility of automated bleeding surveillance in real-world hospital data and demonstrate the added value of leveraging free-text information to complement structured data sources.</p></sec><sec id="s4-2"><title>Comparison to Prior Work</title><p>Our estimated bleeding rates (MB: 8.26% and CRNMB: 15.04%) are consistent with prior hospital-based studies in older adults, which reported MB incidences ranging from 1.8% to 11.3% [<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref36">36</xref>] and CRNMB from 3.5% to 13.0% [<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref37">37</xref>]. These findings confirm that antithrombotic-related bleeding remains a major cause of ADEs in older populations, associated with increased hospitalization length, morbidity, and mortality [<xref ref-type="bibr" rid="ref38">38</xref>], highlighting the need for targeted preventive strategies.</p><p>The algorithms&#x2019; performance varied across structured data sources and aligns with prior research. <italic>ICD-10-GM</italic> codes detected only one-third of MB and CRNMB cases, consistent with previous evidence of underreporting anticoagulant-related bleeding events [<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref40">40</xref>]. Yap et al [<xref ref-type="bibr" rid="ref15">15</xref>] found similarly low sensitivity (16%&#x2010;24%) but very high PPV (&#x003E;0.97), indicating that diagnostic codes are reliable confirmatory markers but poor screening tools. The inclusion of laboratory data markedly improved sensitivity in our SDA model, consistent with findings by Dyas et al [<xref ref-type="bibr" rid="ref6">6</xref>] and Shung et al [<xref ref-type="bibr" rid="ref10">10</xref>]. The modest decline in PPV was likely due to false positives generated by hemoglobin thresholds, a limitation noted in earlier work [<xref ref-type="bibr" rid="ref15">15</xref>].</p><p>Detection of CRNMB was more challenging than MB, partly due to broader definitions and lower specificity of <italic>ICD-10-GM</italic> codes and transfusion data, echoing the moderate performance reported by Yap et al [<xref ref-type="bibr" rid="ref15">15</xref>] (sensitivity 50%&#x2010;56%, PPV 43&#x2010;50%).</p><p>The NLP model contributed substantially to overall detection, with a sensitivity of 61% and PPV of 70%, in line with earlier NLP-based models for bleeding and ADE detection [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref41">41</xref>]. Importantly, only about 20% of events overlapped with those captured by structured data, demonstrating that text analysis retrieves unique clinical insights often missing from coded data. NLP also enhanced temporal resolution by identifying prior bleeding episodes in 8.5% of cases, information generally unavailable from structured data alone. The combined SDA+NLP model achieved high sensitivity (0.84), thereby minimizing the risk of missed events, with only 16% of cases being false negatives. Although this proportion is relatively low, it still represents missed hemorrhagic events that could impact the accuracy of retrospective surveillance and safety signal detection. However, our detection algorithm provides a notable proportion of false positives (49%), which could contribute to alert fatigue in clinical practice and increase the workload associated with unnecessary chart reviews. For real-world deployment, performance thresholds depend on the intended use: for surveillance or signal detection, a sensitivity above 0.80 with PPV above 0.50 is generally acceptable, as false positives can be secondarily reviewed; for clinical decision support, stricter thresholds (eg, PPV&#x2265;0.70) are needed to prevent alert fatigue. Improving true positive detection to 70% would strengthen reliability and clinical applicability, potentially through prioritization or triage of clinically significant cases.</p><p>External validation revealed a decline in MB prevalence and a concurrent increase in CRNMB and MB-related mortality in the validation dataset (2021&#x2010;2022), compared to the CHUV 2015&#x2010;2016 dataset. These trends may reflect evolving prescribing patterns, such as increased use of direct oral anticoagulants and reduced use of vitamin K antagonists, and a shift in clinical profiles, with higher comorbidity scores and greater treatment complexity in the more recent cohort. These observations are consistent with the known bleeding risk profiles of antithrombotic agents, direct oral anticoagulants being more frequently associated with gastrointestinal bleeding (CRNMB), and vitamin K antagonists with intracranial bleeding (MB) [<xref ref-type="bibr" rid="ref42">42</xref>], and underscore the need for dynamic algorithmic models capable of adjusting for changing treatment patterns and patient characteristics [<xref ref-type="bibr" rid="ref43">43</xref>].</p></sec><sec id="s4-3"><title>Strengths and Limitations</title><p>This study has several notable strengths. It is one of the first multicenter initiatives to integrate structured and unstructured EMR data for ADE detection in older hospitalized patients. The inclusion of 3 university hospitals provided a large, diverse dataset, while the harmonization of over 1 million clinical variables ensured robust data quality. Algorithms were developed using internationally accepted definitions of MB and CRNMB and validated through manual chart review, ensuring clinical credibility. External validation on a temporally distinct dataset further reinforced reproducibility and robustness.</p><p>Several limitations should also be considered.</p><p>First, the test dataset (2015&#x2010;2016) was relatively dated and spanned only 2 years, reflecting mostly the time-consuming extraction and harmonization process required to merge data from three hospitals before data interoperability infrastructures were implemented. Consequently, it may not entirely capture current clinical practices. Nevertheless, this limitation was mitigated by validating our pipeline on an independent and more recent dataset.</p><p>Second, NLP development and validation were performed using CHUV data only and did not take into consideration interinstitutional variations in coding practices, hospital information system architecture and interoperability, clinical documentation standards, or local prescribing patterns, which may limit the generalizability of our findings. To mitigate this, the model was trained on a balanced, manually annotated corpus reviewed by 3 independent physicians. Future studies should externally validate the NLP model on datasets from other French-speaking institutions to confirm its performance and enhance its applicability.</p><p>Third, data from 1 hospital (Baden hospital) were excluded due to missing information and harmonization challenges, and CHOP codes could not be extracted from the USZ hospital; this could have led to underestimation of certain bleeding events. Recent efforts have been undertaken to improve data harmonization across sites, which now largely mitigate the harmonization challenges previously encountered.</p><p>Fourth, while <italic>ICD-10-GM</italic> code selection was based on international guidelines and expert review, some misclassification may have occurred. This limitation was partly mitigated by manual validation. However, the adoption of a standardized bleeding classification would help overcome this limitation and harmonize bleeding-event categorization across studies.</p><p>Fifth, causality assessment between bleeding cases and antithrombotic agents was not formally assessed by our algorithms, as this requires strict criteria and necessitates a comprehensive EMR review. Causality was manually evaluated using the WHO&#x2013;Uppsala Monitoring Center framework, which provided valuable contextual insights but is resource-intensive. Future work should investigate semiautomated causal-inference tools to scale this process efficiently.</p><p>Sixth, structured data were insufficient to capture the timing of bleeding cases prior to admission, as such information is documented in discharge summaries, underscoring the need for unstructured data in ADE detection.</p><p>Finally, all participating hospitals were tertiary academic centers with strong data infrastructures and comprehensive documentation practices. While this ensured data reliability and methodological consistency, it may limit the generalizability of our findings to other contexts, such as secondary or community hospitals, or to health systems with different digital maturity levels. Compared to many international settings, Swiss university hospitals operate within a decentralized but highly standardized health care system, characterized by universal coverage and well-developed inpatient services. Future research should evaluate these algorithms in more diverse hospital types and countries to assess their adaptability and scalability beyond tertiary Swiss institutions.</p></sec><sec id="s4-4"><title>Future Directions</title><p>This study illustrates the value of combining structured and unstructured clinical data to improve the detection of bleeding events in older inpatients exposed to antithrombotic therapy. This integrated approach can enhance pharmacovigilance systems, reduce underreporting, and support timely clinical interventions. Future efforts should expand algorithm coverage to additional unstructured sources (eg, nursing notes and consultation letters), improve clinical documentation practices, and incorporate semiautomated causality assessment tools. Combining these detection models with multivariate risk stratification that integrates patient-specific factors (age, comorbidities, comedications, and clinical service) could enable prioritization of clinically meaningful alerts. Finally, embedding such tools within common data models and privacy-preserving data-sharing infrastructures, such as those promoted by the Swiss Personalized Health Network, could facilitate cross-institutional learning health systems and accelerate artificial intelligence-supported pharmacovigilance in real-world clinical practice.</p></sec></sec></body><back><ack><p>The authors thank all contributors to data extraction and processing across participating sites, with special appreciation to Walid Gharib-Blanc and Alexandre Wetzel. We gratefully acknowledge Tapio Niemi, Marie Bettex, and Patrick Taff&#x00E9; (Unisant&#x00E9;, Department of Epidemiology and Health Systems, University of Lausanne, Switzerland).</p><p>The SwissMADE collaborators are Bernard Burnand, Department of Epidemiology and Health Systems, Unisant&#x00E9; and University of Lausanne, Lausanne, Switzerland; Pierre Olivier Lang, Geriatric Medicine and Geriatric Rehabilitation Division, Department of Medicine, University Hospital of Lausanne, Lausanne, Switzerland; Nicola Colic, Dalle Molle Institute for Artificial Intelligence Research, Universit&#x00E0; della Svizzera Italiana, Lugano, Switzerland; Angela Schulthess-Lisibach, Institute of Primary Health Care, University of Bern, Bern, Switzerland; Christophe Gaudet-Blavignac, Division of Medical Information Sciences, Geneva University Hospitals, Geneva, Switzerland and Department of Radiology and Medical Informatics, University of Geneva, Geneva, Switzerland; Nathalie Casati, Clinical Data Science Group, Lausanne University Hospital, Lausanne, Switzerland; Jean-Philippe Goldman, Faculty of Letters, Department of Linguistics, University of Geneva, Geneva, Switzerland; and Vasiliki Foufi, Division of Medical Information Sciences, University Hospitals of Geneva, Geneva, Switzerland and Faculty of Medicine, University of Geneva, Geneva, Switzerland.</p></ack><notes><sec><title>Funding</title><p>This study was partially supported by the Swiss National Research Fund (project 167381). The funder had no role in study design, data collection, data analysis, data interpretation, or writing of the report.</p></sec><sec><title>Data Availability</title><p>Requests for access to the anonymized dataset and study materials should be directed to the corresponding author and will be considered on a case-by-case basis in accordance with institutional policies and applicable data protection regulations.</p></sec></notes><fn-group><fn fn-type="con"><p>MALP and C Csajak designed the study; MALP, FG, and C Csajak wrote and submitted the proposal. CL, Christophe Gaudet-Blavignac, Bernard Burnand, FR, ML, Pierre Olivier Lang, and PEB contributed to the development of the study proposal and participated in its revision. CL, PEB, Christophe Gaudet-Blavignac, Nicola Colic, ML, and FR contributed to data extraction and curation. C Coumou, MALP, C Csajak, and FG conducted the study and designed the rule-based algorithms. C Coumou, MALP, C Csajak, FG, and MZ performed the formal analysis. LA contributed to the conceptualization of the rule-based algorithms. MZ and EB designed and implemented the natural language processing algorithms. C Coumou has written the original draft of the manuscript. MALP, C Csajak, FG, and LA contributed to the conceptualization, supervision, and review and editing of the manuscript. The SwissMADE collaborators were consulted on methodological aspects throughout the study. All authors have read and approved the final version of the manuscript.</p></fn><fn fn-type="conflict"><p>PEB reports having received fees and funding from AstraZeneca for matters unrelated to the present study. All other authors declare no competing interests.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">ADE</term><def><p>adverse drug event</p></def></def-item><def-item><term id="abb2">CHOP</term><def><p>Swiss Classification of Surgical Procedures</p></def></def-item><def-item><term id="abb3">CHUV</term><def><p>Lausanne University Hospital</p></def></def-item><def-item><term id="abb4">CRNMB</term><def><p>clinically relevant nonmajor bleeding</p></def></def-item><def-item><term id="abb5">EMR</term><def><p>electronic medical record</p></def></def-item><def-item><term id="abb6">HUG</term><def><p>Geneva University Hospital</p></def></def-item><def-item><term id="abb7"><italic>ICD-10-GM</italic></term><def><p><italic>International Statistical Classification of Diseases, 10th Revision, German Modification</italic></p></def></def-item><def-item><term id="abb8">ISTH</term><def><p>International Society on Thrombosis and Haemostasis</p></def></def-item><def-item><term id="abb9">KSB</term><def><p>Baden Cantonal Hospital</p></def></def-item><def-item><term id="abb10">MB</term><def><p>major bleeding</p></def></def-item><def-item><term id="abb11">ML</term><def><p>machine learning</p></def></def-item><def-item><term id="abb12">NLP</term><def><p>natural language processing</p></def></def-item><def-item><term id="abb13">PPV</term><def><p>positive predictive value</p></def></def-item><def-item><term id="abb14">SDA</term><def><p>structured data algorithms</p></def></def-item><def-item><term id="abb15">STROBE</term><def><p>Strengthening the Reporting of Observational Studies in Epidemiology</p></def></def-item><def-item><term id="abb16">USZ</term><def><p>Z&#x00FC;rich University Hospital</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jennings</surname><given-names>ELM</given-names> </name><name name-style="western"><surname>Murphy</surname><given-names>KD</given-names> </name><name name-style="western"><surname>Gallagher</surname><given-names>P</given-names> </name><name name-style="western"><surname>O&#x2019;Mahony</surname><given-names>D</given-names> </name></person-group><article-title>In-hospital adverse drug reactions in older adults; prevalence, presentation and associated drugs-a systematic review and meta-analysis</article-title><source>Age Ageing</source><year>2020</year><month>10</month><day>23</day><volume>49</volume><issue>6</issue><fpage>948</fpage><lpage>958</lpage><pub-id pub-id-type="doi">10.1093/ageing/afaa188</pub-id><pub-id pub-id-type="medline">33022061</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Long</surname><given-names>SJ</given-names> </name><name name-style="western"><surname>Brown</surname><given-names>KF</given-names> </name><name name-style="western"><surname>Ames</surname><given-names>D</given-names> </name><name name-style="western"><surname>Vincent</surname><given-names>C</given-names> </name></person-group><article-title>What is known about adverse events in older medical hospital inpatients? A systematic review of the literature</article-title><source>Int J Qual Health Care</source><year>2013</year><month>10</month><volume>25</volume><issue>5</issue><fpage>542</fpage><lpage>554</lpage><pub-id pub-id-type="doi">10.1093/intqhc/mzt056</pub-id><pub-id pub-id-type="medline">23925507</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Andreotti</surname><given-names>F</given-names> </name><name name-style="western"><surname>Rocca</surname><given-names>B</given-names> </name><name name-style="western"><surname>Husted</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Antithrombotic therapy in the elderly: expert position paper of the European Society of Cardiology Working Group on Thrombosis</article-title><source>Eur Heart J</source><year>2015</year><month>12</month><day>7</day><volume>36</volume><issue>46</issue><fpage>3238</fpage><lpage>3249</lpage><pub-id pub-id-type="doi">10.1093/eurheartj/ehv304</pub-id><pub-id pub-id-type="medline">26163482</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hazell</surname><given-names>L</given-names> </name><name name-style="western"><surname>Shakir</surname><given-names>SAW</given-names> </name></person-group><article-title>Under-reporting of adverse drug reactions: a systematic review</article-title><source>Drug Saf</source><year>2006</year><volume>29</volume><issue>5</issue><fpage>385</fpage><lpage>396</lpage><pub-id pub-id-type="doi">10.2165/00002018-200629050-00003</pub-id><pub-id pub-id-type="medline">16689555</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Murff</surname><given-names>HJ</given-names> </name><name name-style="western"><surname>Patel</surname><given-names>VL</given-names> </name><name name-style="western"><surname>Hripcsak</surname><given-names>G</given-names> </name><name name-style="western"><surname>Bates</surname><given-names>DW</given-names> </name></person-group><article-title>Detecting adverse events for patient safety research: a review of current methodologies</article-title><source>J Biomed Inform</source><year>2003</year><volume>36</volume><issue>1-2</issue><fpage>131</fpage><lpage>143</lpage><pub-id pub-id-type="doi">10.1016/j.jbi.2003.08.003</pub-id><pub-id pub-id-type="medline">14552854</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dyas</surname><given-names>AR</given-names> </name><name name-style="western"><surname>Zhuang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Meguid</surname><given-names>RA</given-names> </name><etal/></person-group><article-title>Development and validation of a model for surveillance of postoperative bleeding complications using structured electronic health records data</article-title><source>Surgery</source><year>2022</year><month>12</month><volume>172</volume><issue>6</issue><fpage>1728</fpage><lpage>1732</lpage><pub-id pub-id-type="doi">10.1016/j.surg.2022.08.021</pub-id><pub-id pub-id-type="medline">36150923</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kashkoush</surname><given-names>J</given-names> </name><name name-style="western"><surname>Gupta</surname><given-names>M</given-names> </name><name name-style="western"><surname>Meissner</surname><given-names>MA</given-names> </name><name name-style="western"><surname>Nielsen</surname><given-names>ME</given-names> </name><name name-style="western"><surname>Kirchner</surname><given-names>HL</given-names> </name><name name-style="western"><surname>Garg</surname><given-names>T</given-names> </name></person-group><article-title>Performance characteristics of a rule-based electronic health record algorithm to identify patients with gross and microscopic hematuria</article-title><source>Methods Inf Med</source><year>2023</year><month>12</month><volume>62</volume><issue>5-06</issue><fpage>183</fpage><lpage>192</lpage><pub-id pub-id-type="doi">10.1055/a-2165-5552</pub-id><pub-id pub-id-type="medline">37666279</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hung</surname><given-names>CY</given-names> </name><name name-style="western"><surname>Lin</surname><given-names>CH</given-names> </name><name name-style="western"><surname>Chang</surname><given-names>CS</given-names> </name><name name-style="western"><surname>Li</surname><given-names>JL</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>CC</given-names> </name></person-group><article-title>Predicting gastrointestinal bleeding events from multimodal in-hospital electronic health records using deep fusion networks</article-title><source>Annu Int Conf IEEE Eng Med Biol Soc</source><year>2019</year><month>07</month><volume>2019</volume><fpage>2447</fpage><lpage>2450</lpage><pub-id pub-id-type="doi">10.1109/EMBC.2019.8857244</pub-id><pub-id pub-id-type="medline">31946393</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Salas</surname><given-names>M</given-names> </name><name name-style="western"><surname>Petracek</surname><given-names>J</given-names> </name><name name-style="western"><surname>Yalamanchili</surname><given-names>P</given-names> </name><etal/></person-group><article-title>The use of artificial intelligence in pharmacovigilance: a systematic review of the literature</article-title><source>Pharmaceut Med</source><year>2022</year><month>10</month><volume>36</volume><issue>5</issue><fpage>295</fpage><lpage>306</lpage><pub-id pub-id-type="doi">10.1007/s40290-022-00441-z</pub-id><pub-id pub-id-type="medline">35904529</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shung</surname><given-names>D</given-names> </name><name name-style="western"><surname>Tsay</surname><given-names>C</given-names> </name><name name-style="western"><surname>Laine</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Early identification of patients with acute gastrointestinal bleeding using natural language processing and decision rules</article-title><source>J Gastroenterol Hepatol</source><year>2021</year><month>06</month><volume>36</volume><issue>6</issue><fpage>1590</fpage><lpage>1597</lpage><pub-id pub-id-type="doi">10.1111/jgh.15313</pub-id><pub-id pub-id-type="medline">33105045</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Li</surname><given-names>R</given-names> </name><name name-style="western"><surname>Hu</surname><given-names>B</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>F</given-names> </name><etal/></person-group><article-title>Detection of bleeding events in electronic health record notes using convolutional neural network models enhanced with recurrent neural network autoencoders: deep learning approach</article-title><source>JMIR Med Inform</source><year>2019</year><month>02</month><day>8</day><volume>7</volume><issue>1</issue><fpage>e10788</fpage><pub-id pub-id-type="doi">10.2196/10788</pub-id><pub-id pub-id-type="medline">30735140</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mitra</surname><given-names>A</given-names> </name><name name-style="western"><surname>Rawat</surname><given-names>BPS</given-names> </name><name name-style="western"><surname>McManus</surname><given-names>DD</given-names> </name><name name-style="western"><surname>Yu</surname><given-names>H</given-names> </name></person-group><article-title>Relation classification for bleeding events from electronic health records using deep learning systems: an empirical study</article-title><source>JMIR Med Inform</source><year>2021</year><month>07</month><day>2</day><volume>9</volume><issue>7</issue><fpage>e27527</fpage><pub-id pub-id-type="doi">10.2196/27527</pub-id><pub-id pub-id-type="medline">34255697</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Taggart</surname><given-names>M</given-names> </name><name name-style="western"><surname>Chapman</surname><given-names>WW</given-names> </name><name name-style="western"><surname>Steinberg</surname><given-names>BA</given-names> </name><etal/></person-group><article-title>Comparison of 2 natural language processing methods for identification of bleeding among critically Ill patients</article-title><source>JAMA Netw Open</source><year>2018</year><month>10</month><day>5</day><volume>1</volume><issue>6</issue><fpage>e183451</fpage><pub-id pub-id-type="doi">10.1001/jamanetworkopen.2018.3451</pub-id><pub-id pub-id-type="medline">30646240</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Walker</surname><given-names>AL</given-names> </name><name name-style="western"><surname>Watson</surname><given-names>C</given-names> </name><name name-style="western"><surname>Butcher</surname><given-names>R</given-names> </name><name name-style="western"><surname>Abedin</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Yandell</surname><given-names>M</given-names> </name><name name-style="western"><surname>Shah</surname><given-names>RU</given-names> </name></person-group><article-title>Use of commercially available natural language processing software to identify bleeding from the medical record</article-title><source>medRxiv</source><comment>Preprint posted online on  Nov 19, 2021</comment><pub-id pub-id-type="doi">10.1101/2021.11.19.21266586</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yap</surname><given-names>AJY</given-names> </name><name name-style="western"><surname>Teo</surname><given-names>DCH</given-names> </name><name name-style="western"><surname>Ang</surname><given-names>PS</given-names> </name><etal/></person-group><article-title>Validation of a major and clinically relevant nonmajor bleeding phenotyping algorithm on electronic health records</article-title><source>Pharmacoepidemiol Drug Saf</source><year>2024</year><month>08</month><volume>33</volume><issue>8</issue><fpage>e5875</fpage><pub-id pub-id-type="doi">10.1002/pds.5875</pub-id><pub-id pub-id-type="medline">39090800</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hung</surname><given-names>LC</given-names> </name><name name-style="western"><surname>Su</surname><given-names>YY</given-names> </name><name name-style="western"><surname>Sun</surname><given-names>JM</given-names> </name><name name-style="western"><surname>Huang</surname><given-names>WT</given-names> </name><name name-style="western"><surname>Sung</surname><given-names>SF</given-names> </name></person-group><article-title>Clinical narratives as a predictor for prognosticating functional outcomes after intracerebral hemorrhage</article-title><source>J Neurol Sci</source><year>2023</year><month>10</month><day>15</day><volume>453</volume><fpage>120807</fpage><pub-id pub-id-type="doi">10.1016/j.jns.2023.120807</pub-id><pub-id pub-id-type="medline">37717279</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lee</surname><given-names>HJ</given-names> </name><name name-style="western"><surname>Jiang</surname><given-names>M</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>A comparative study of different methods for automatic identification of clopidogrel-induced bleedings in electronic health records</article-title><source>AMIA Jt Summits Transl Sci Proc</source><year>2017</year><volume>2017</volume><fpage>185</fpage><lpage>192</lpage><pub-id pub-id-type="medline">28815128</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Deng</surname><given-names>B</given-names> </name><name name-style="western"><surname>Zhu</surname><given-names>W</given-names> </name><name name-style="western"><surname>Sun</surname><given-names>X</given-names> </name><etal/></person-group><article-title>Development and validation of an automatic system for intracerebral hemorrhage medical text recognition and treatment plan output</article-title><source>Front Aging Neurosci</source><year>2022</year><volume>14</volume><fpage>798132</fpage><pub-id pub-id-type="doi">10.3389/fnagi.2022.798132</pub-id><pub-id pub-id-type="medline">35462698</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hansen</surname><given-names>RS</given-names> </name><name name-style="western"><surname>Lynggaard</surname><given-names>RB</given-names> </name><name name-style="western"><surname>Laursen</surname><given-names>MS</given-names> </name><name name-style="western"><surname>Lykke</surname><given-names>FM</given-names> </name><name name-style="western"><surname>Vinholt</surname><given-names>PJ</given-names> </name></person-group><article-title>Identification of hematuria with a natural language processing model and validation of hematuria diagnosecodes</article-title><source>Thromb Res</source><year>2024</year><month>12</month><volume>244</volume><fpage>109182</fpage><pub-id pub-id-type="doi">10.1016/j.thromres.2024.109182</pub-id><pub-id pub-id-type="medline">39426095</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mehran</surname><given-names>R</given-names> </name><name name-style="western"><surname>Rao</surname><given-names>SV</given-names> </name><name name-style="western"><surname>Bhatt</surname><given-names>DL</given-names> </name><etal/></person-group><article-title>Standardized bleeding definitions for cardiovascular clinical trials: a consensus report from the Bleeding Academic Research Consortium</article-title><source>Circulation</source><year>2011</year><month>06</month><day>14</day><volume>123</volume><issue>23</issue><fpage>2736</fpage><lpage>2747</lpage><pub-id pub-id-type="doi">10.1161/CIRCULATIONAHA.110.009449</pub-id><pub-id pub-id-type="medline">21670242</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="web"><article-title>Le CHUV en chiffres [Web Page in French]</article-title><source>Centre Hospitalier Universitaire Vaudois</source><year>2023</year><access-date>2026-01-10</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.chuv.ch/fr/a-propos/le-chuv-en-chiffres">https://www.chuv.ch/fr/a-propos/le-chuv-en-chiffres</ext-link></comment></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="web"><article-title>Facts, figures and dates</article-title><source>H&#x00F4;pitaux Universitaires De Gen&#x00E8;ve</source><access-date>2026-01-10</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.hug.ch/en/facts-figures-and-dates">https://www.hug.ch/en/facts-figures-and-dates</ext-link></comment></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="web"><article-title>About the USZ 2025</article-title><source>Universit&#x00E4;ts Spital Z&#x00FC;rich</source><access-date>2025-10-07</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.usz.ch/en/about-university-hospital-zurich">https://www.usz.ch/en/about-university-hospital-zurich</ext-link></comment></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="web"><article-title>KSB weiterhin auf wachstumskurs [Web Page in German]</article-title><source>Kantonsspital Baden</source><year>2024</year><access-date>2026-01-10</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.kantonsspitalbaden.ch/news/ksb-weiterhin-auf-wachstumskurs">https://www.kantonsspitalbaden.ch/news/ksb-weiterhin-auf-wachstumskurs</ext-link></comment></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gaspar</surname><given-names>F</given-names> </name><name name-style="western"><surname>Lutters</surname><given-names>M</given-names> </name><name name-style="western"><surname>Beeler</surname><given-names>PE</given-names> </name><etal/></person-group><article-title>Automatic detection of adverse drug events in geriatric care: study proposal</article-title><source>JMIR Res Protoc</source><year>2022</year><month>11</month><day>15</day><volume>11</volume><issue>11</issue><fpage>e40456</fpage><pub-id pub-id-type="doi">10.2196/40456</pub-id><pub-id pub-id-type="medline">36378522</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Schulman</surname><given-names>S</given-names> </name><name name-style="western"><surname>Kearon</surname><given-names>C</given-names> </name><collab>Subcommittee on Control of Anticoagulation of the Scientific and Standardization Committee of the International Society on Thrombosis and Haemostasis</collab></person-group><article-title>Definition of major bleeding in clinical investigations of antihemostatic medicinal products in non-surgical patients</article-title><source>J Thromb Haemost</source><year>2005</year><month>04</month><volume>3</volume><issue>4</issue><fpage>692</fpage><lpage>694</lpage><pub-id pub-id-type="doi">10.1111/j.1538-7836.2005.01204.x</pub-id><pub-id pub-id-type="medline">15842354</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kaatz</surname><given-names>S</given-names> </name><name name-style="western"><surname>Ahmad</surname><given-names>D</given-names> </name><name name-style="western"><surname>Spyropoulos</surname><given-names>AC</given-names> </name><name name-style="western"><surname>Schulman</surname><given-names>S</given-names> </name><collab>Subcommittee on Control of Anticoagulation</collab></person-group><article-title>Definition of clinically relevant non-major bleeding in studies of anticoagulants in atrial fibrillation and venous thromboembolic disease in non-surgical patients: communication from the SSC of the ISTH</article-title><source>J Thromb Haemost</source><year>2015</year><month>11</month><volume>13</volume><issue>11</issue><fpage>2119</fpage><lpage>2126</lpage><pub-id pub-id-type="doi">10.1111/jth.13140</pub-id><pub-id pub-id-type="medline">26764429</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Honnibal</surname><given-names>M</given-names> </name><name name-style="western"><surname>Montani</surname><given-names>I</given-names> </name></person-group><article-title>spaCy 2: natural language understanding with Bloom embeddings, convolutional neural networks and incremental parsing</article-title><source>Sentometrics Res</source><year>2017</year><access-date>2025-08-21</access-date><volume>7</volume><issue>1</issue><fpage>411</fpage><lpage>420</lpage><comment><ext-link ext-link-type="uri" xlink:href="https://sentometrics-research.com/publication/72/">https://sentometrics-research.com/publication/72/</ext-link></comment></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gaspar</surname><given-names>F</given-names> </name><name name-style="western"><surname>Zayene</surname><given-names>M</given-names> </name><name name-style="western"><surname>Coumau</surname><given-names>C</given-names> </name><etal/></person-group><article-title>Natural language processing and ICD-10 coding for detecting bleeding events in discharge summaries: comparative cross-sectional study</article-title><source>JMIR Med Inform</source><year>2025</year><month>08</month><day>29</day><volume>13</volume><fpage>e67837</fpage><pub-id pub-id-type="doi">10.2196/67837</pub-id><pub-id pub-id-type="medline">40882207</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Taff&#x00E9;</surname><given-names>P</given-names> </name><name name-style="western"><surname>Halfon</surname><given-names>P</given-names> </name><name name-style="western"><surname>Ghali</surname><given-names>WA</given-names> </name><name name-style="western"><surname>Burnand</surname><given-names>B</given-names> </name><collab>International Methodology Consortium for Coded Health Information (IMECCHI)</collab></person-group><article-title>Test result-based sampling: an efficient design for estimating the accuracy of patient safety indicators</article-title><source>Med Decis Making</source><year>2012</year><volume>32</volume><issue>1</issue><fpage>E1</fpage><lpage>12</lpage><pub-id pub-id-type="doi">10.1177/0272989X11426176</pub-id><pub-id pub-id-type="medline">22065144</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Landis</surname><given-names>JR</given-names> </name><name name-style="western"><surname>Koch</surname><given-names>GG</given-names> </name></person-group><article-title>The measurement of observer agreement for categorical data</article-title><source>Biometrics</source><year>1977</year><month>03</month><volume>33</volume><issue>1</issue><fpage>159</fpage><lpage>174</lpage><pub-id pub-id-type="doi">10.2307/2529310</pub-id><pub-id pub-id-type="medline">843571</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="report"><article-title>The use of the WHO-UMC system for standardised case causality assessment</article-title><year>2018</year><access-date>2026-01-10</access-date><publisher-name>World Health Organization - Uppsala Monitoring Centre</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://www.who.int/docs/default-source/medicines/pharmacovigilance/whocausality-assessment.pdf">https://www.who.int/docs/default-source/medicines/pharmacovigilance/whocausality-assessment.pdf</ext-link></comment></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Charlson</surname><given-names>ME</given-names> </name><name name-style="western"><surname>Pompei</surname><given-names>P</given-names> </name><name name-style="western"><surname>Ales</surname><given-names>KL</given-names> </name><name name-style="western"><surname>MacKenzie</surname><given-names>CR</given-names> </name></person-group><article-title>A new method of classifying prognostic comorbidity in longitudinal studies: development and validation</article-title><source>J Chronic Dis</source><year>1987</year><volume>40</volume><issue>5</issue><fpage>373</fpage><lpage>383</lpage><pub-id pub-id-type="doi">10.1016/0021-9681(87)90171-8</pub-id><pub-id pub-id-type="medline">3558716</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Elixhauser</surname><given-names>A</given-names> </name><name name-style="western"><surname>Steiner</surname><given-names>C</given-names> </name><name name-style="western"><surname>Harris</surname><given-names>DR</given-names> </name><name name-style="western"><surname>Coffey</surname><given-names>RM</given-names> </name></person-group><article-title>Comorbidity measures for use with administrative data</article-title><source>Med Care</source><year>1998</year><month>01</month><volume>36</volume><issue>1</issue><fpage>8</fpage><lpage>27</lpage><pub-id pub-id-type="doi">10.1097/00005650-199801000-00004</pub-id><pub-id pub-id-type="medline">9431328</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ferrazzini</surname><given-names>E</given-names> </name><name name-style="western"><surname>M&#x00E9;an</surname><given-names>M</given-names> </name><name name-style="western"><surname>Stalder</surname><given-names>O</given-names> </name><name name-style="western"><surname>Limacher</surname><given-names>A</given-names> </name><name name-style="western"><surname>Rodondi</surname><given-names>N</given-names> </name><name name-style="western"><surname>Aujesky</surname><given-names>D</given-names> </name></person-group><article-title>Incidence and clinical impact of bleeding events in older patients with acute venous thromboembolism</article-title><source>Blood Adv</source><year>2023</year><month>01</month><day>24</day><volume>7</volume><issue>2</issue><fpage>205</fpage><lpage>213</lpage><pub-id pub-id-type="doi">10.1182/bloodadvances.2022007263</pub-id><pub-id pub-id-type="medline">35381071</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>G&#x00F3;mez-Cuervo</surname><given-names>C</given-names> </name><name name-style="western"><surname>Rivas</surname><given-names>A</given-names> </name><name name-style="western"><surname>Vison&#x00E0;</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Predicting the risk for major bleeding in elderly patients with venous thromboembolism using the Charlson index. Findings from the RIETE</article-title><source>J Thromb Thrombolysis</source><year>2021</year><month>05</month><volume>51</volume><issue>4</issue><fpage>1017</fpage><lpage>1025</lpage><pub-id pub-id-type="doi">10.1007/s11239-020-02274-6</pub-id><pub-id pub-id-type="medline">32945982</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Poli</surname><given-names>D</given-names> </name><name name-style="western"><surname>Antonucci</surname><given-names>E</given-names> </name><name name-style="western"><surname>Bert&#x00F9;</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Very elderly patients with venous thromboembolism on oral anticoagulation with VKAs or DOACs: results from the prospective multicenter START2-Register Study</article-title><source>Thromb Res</source><year>2019</year><month>11</month><volume>183</volume><fpage>28</fpage><lpage>32</lpage><pub-id pub-id-type="doi">10.1016/j.thromres.2019.08.024</pub-id><pub-id pub-id-type="medline">31536872</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Prasad</surname><given-names>N</given-names> </name><name name-style="western"><surname>Lau</surname><given-names>ECY</given-names> </name><name name-style="western"><surname>Wojt</surname><given-names>I</given-names> </name><name name-style="western"><surname>Penm</surname><given-names>J</given-names> </name><name name-style="western"><surname>Dai</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Tan</surname><given-names>ECK</given-names> </name></person-group><article-title>Prevalence of and risk factors for drug-related readmissions in older adults: a systematic review and meta-analysis</article-title><source>Drugs Aging</source><year>2024</year><month>01</month><volume>41</volume><issue>1</issue><fpage>1</fpage><lpage>11</lpage><pub-id pub-id-type="doi">10.1007/s40266-023-01076-8</pub-id><pub-id pub-id-type="medline">37864770</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shehab</surname><given-names>N</given-names> </name><name name-style="western"><surname>Ziemba</surname><given-names>R</given-names> </name><name name-style="western"><surname>Campbell</surname><given-names>KN</given-names> </name><etal/></person-group><article-title>Assessment of ICD-10-CM code assignment validity for case finding of outpatient anticoagulant-related bleeding among Medicare beneficiaries</article-title><source>Pharmacoepidemiol Drug Saf</source><year>2019</year><month>07</month><volume>28</volume><issue>7</issue><fpage>951</fpage><lpage>964</lpage><pub-id pub-id-type="doi">10.1002/pds.4783</pub-id><pub-id pub-id-type="medline">31144403</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Joos</surname><given-names>C</given-names> </name><name name-style="western"><surname>Lawrence</surname><given-names>K</given-names> </name><name name-style="western"><surname>Jones</surname><given-names>AE</given-names> </name><name name-style="western"><surname>Johnson</surname><given-names>SA</given-names> </name><name name-style="western"><surname>Witt</surname><given-names>DM</given-names> </name></person-group><article-title>Accuracy of ICD-10 codes for identifying hospitalizations for acute anticoagulation therapy-related bleeding events</article-title><source>Thromb Res</source><year>2019</year><month>09</month><volume>181</volume><fpage>71</fpage><lpage>76</lpage><pub-id pub-id-type="doi">10.1016/j.thromres.2019.07.021</pub-id><pub-id pub-id-type="medline">31357146</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mitra</surname><given-names>A</given-names> </name><name name-style="western"><surname>Rawat</surname><given-names>BPS</given-names> </name><name name-style="western"><surname>McManus</surname><given-names>D</given-names> </name><name name-style="western"><surname>Kapoor</surname><given-names>A</given-names> </name><name name-style="western"><surname>Yu</surname><given-names>H</given-names> </name></person-group><article-title>Bleeding entity recognition in electronic health records: a comprehensive analysis of end-to-end systems</article-title><source>AMIA Annu Symp Proc</source><year>2020</year><volume>2020</volume><fpage>860</fpage><lpage>869</lpage><pub-id pub-id-type="medline">33936461</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Xu</surname><given-names>W</given-names> </name><name name-style="western"><surname>Lv</surname><given-names>M</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Severe bleeding risk of direct oral anticoagulants versus vitamin K antagonists for stroke prevention and treatment in patients with atrial fibrillation: a systematic review and network meta-analysis</article-title><source>Cardiovasc Drugs Ther</source><year>2023</year><month>04</month><volume>37</volume><issue>2</issue><fpage>363</fpage><lpage>377</lpage><pub-id pub-id-type="doi">10.1007/s10557-021-07232-9</pub-id><pub-id pub-id-type="medline">34436708</pub-id></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mant</surname><given-names>J</given-names> </name></person-group><article-title>Process versus outcome indicators in the assessment of quality of health care</article-title><source>Int J Qual Health Care</source><year>2001</year><month>12</month><volume>13</volume><issue>6</issue><fpage>475</fpage><lpage>480</lpage><pub-id pub-id-type="doi">10.1093/intqhc/13.6.475</pub-id><pub-id pub-id-type="medline">11769750</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>International definitions of major bleeding and clinically relevant nonmajor bleeding: a comparative overview.</p><media xlink:href="jmir_v28i1e77809_app1.docx" xlink:title="DOCX File, 68 KB"/></supplementary-material><supplementary-material id="app2"><label>Multimedia Appendix 2</label><p>List of synonyms for major bleeding and clinically relevant nonmajor bleeding cases.</p><media xlink:href="jmir_v28i1e77809_app2.docx" xlink:title="DOCX File, 17 KB"/></supplementary-material><supplementary-material id="app3"><label>Multimedia Appendix 3</label><p>Interrater reliability assessment among manual reviewers.</p><media xlink:href="jmir_v28i1e77809_app3.docx" xlink:title="DOCX File, 18 KB"/></supplementary-material><supplementary-material id="app4"><label>Multimedia Appendix 4</label><p>Causality assessment between antithrombotic treatment and bleeding.</p><media xlink:href="jmir_v28i1e77809_app4.docx" xlink:title="DOCX File, 16 KB"/></supplementary-material><supplementary-material id="app5"><label>Multimedia Appendix 5</label><p>Overview of missing values per variable used in major bleeding and clinically relevant nonmajor bleeding algorithms.</p><media xlink:href="jmir_v28i1e77809_app5.docx" xlink:title="DOCX File, 15 KB"/></supplementary-material><supplementary-material id="app6"><label>Multimedia Appendix 6</label><p>Comparison of clinical characteristics of Lausanne University Hospital 2015-2016 vs 2021-2022 cohorts.</p><media xlink:href="jmir_v28i1e77809_app6.docx" xlink:title="DOCX File, 23 KB"/></supplementary-material><supplementary-material id="app7"><label>Checklist 1</label><p>STROBE checklist.</p><media xlink:href="jmir_v28i1e77809_app7.docx" xlink:title="DOCX File, 24 KB"/></supplementary-material></app-group></back></article>