<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id><journal-id journal-id-type="publisher-id">jmir</journal-id><journal-id journal-id-type="index">1</journal-id><journal-title>Journal of Medical Internet Research</journal-title><abbrev-journal-title>J Med Internet Res</abbrev-journal-title><issn pub-type="epub">1438-8871</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v27i1e71113</article-id><article-id pub-id-type="doi">10.2196/71113</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Automated Extraction of Mortality Information From Publicly Available Sources Using Large Language Models: Development and Evaluation Study</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Al-Garadi</surname><given-names>Mohammed</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>LeNoue-Newton</surname><given-names>Michele</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Matheny</surname><given-names>Michael E</given-names></name><degrees>MD, MS, MPH</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>McPheeters</surname><given-names>Melissa</given-names></name><degrees>MPH, PhD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Whitaker</surname><given-names>Jill M</given-names></name><degrees>MSN</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Deere</surname><given-names>Jessica A</given-names></name><degrees>MPH</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>McLemore</surname><given-names>Michael F</given-names></name><degrees>BSN, RN</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Westerman</surname><given-names>Dax</given-names></name><degrees>MS</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Khan</surname><given-names>Mirza S</given-names></name><degrees>MS</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Hern&#x00E1;ndez-Mu&#x00F1;oz</surname><given-names>Jos&#x00E9; J</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Wang</surname><given-names>Xi</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Kuzucan</surname><given-names>Aida</given-names></name><degrees>PharmD</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Desai</surname><given-names>Rishi J</given-names></name><degrees>MS, PhD</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Reeves</surname><given-names>Ruth</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib></contrib-group><aff id="aff1"><institution>Department of Biomedical Informatics, Vanderbilt University Medical Center</institution><addr-line>2525 West End Avenue</addr-line><addr-line>Nashville</addr-line><addr-line>TN</addr-line><country>United States</country></aff><aff id="aff2"><institution/><addr-line>Research Triangle Park</addr-line><addr-line>NC</addr-line><country>United States</country></aff><aff id="aff3"><institution>United States Food and Drug Administration</institution><addr-line>Silver Spring</addr-line><addr-line>MD</addr-line><country>United States</country></aff><aff id="aff4"><institution>Harvard University</institution><addr-line>Cambridge</addr-line><addr-line>MA</addr-line><country>United States</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Sarvestan</surname><given-names>Javad</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Heemelaar</surname><given-names>J C</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Young</surname><given-names>Peter W</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to  Mohammed Al-Garadi, PhD, Department of Biomedical Informatics, Vanderbilt University Medical Center, 2525 West End Avenue, Nashville, TN, 37203, United States, 1 2139151696; <email>mohammed.a.al-garadi@vumc.org</email></corresp></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>18</day><month>8</month><year>2025</year></pub-date><volume>27</volume><elocation-id>e71113</elocation-id><history><date date-type="received"><day>10</day><month>01</month><year>2025</year></date><date date-type="rev-recd"><day>15</day><month>04</month><year>2025</year></date><date date-type="accepted"><day>16</day><month>04</month><year>2025</year></date></history><copyright-statement>&#x00A9; Mohammed Al-Garadi, Michele LeNoue-Newton, Michael E Matheny, Melissa McPheeters, Jill M Whitaker, Jessica A Deere, Michael F McLemore, Dax Westerman, Mirza S Khan, Jos&#x00E9; J Hern&#x00E1;ndez-Mu&#x00F1;oz, Xi Wang, Aida Kuzucan, Rishi J Desai, Ruth Reeves. Originally published in the Journal of Medical Internet Research (<ext-link ext-link-type="uri" xlink:href="https://www.jmir.org">https://www.jmir.org</ext-link>), 18.8.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research (ISSN 1438-8871), is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://www.jmir.org/">https://www.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://www.jmir.org/2025/1/e71113"/><abstract><sec><title>Background</title><p>Mortality is a critical variable in health care research, especially for evaluating medical product safety and effectiveness. However, inconsistencies in the availability and timeliness of death date and cause of death (CoD) information present significant challenges. Conventional sources such as the National Death Index and electronic health records often experience data lags, missing fields, or incomplete coverage, limiting their utility in time-sensitive or large-scale studies. With the growing use of social media, crowdfunding platforms, and web-based memorials, publicly available digital content has emerged as a potential supplementary source for mortality surveillance. Despite this potential, accurate tools for extracting mortality information from such unstructured data sources remain underdeveloped.</p></sec><sec><title>Objective</title><p>The aim of the study is to develop scalable approaches using natural language processing (NLP) and large language models (LLMs) for the extraction of mortality information from publicly available web-based data sources, including social media platforms, crowdfunding websites, and web-based obituaries, and to evaluate their performance across various sources.</p></sec><sec sec-type="methods"><title>Methods</title><p>Data were collected from public posts on X (formerly known as Twitter), GoFundMe campaigns, memorial websites (EverLoved and TributeArchive), and web-based obituaries from 2015 to 2022, focusing on US-based content relevant to mortality. We developed an NLP pipeline using transformer-based models to extract key mortality information such as decedent names, dates of birth, and dates of death. We then used a few-shot learning (FSL) approach with LLMs to identify primary and secondary CoDs. Model performance was assessed using precision, recall, <italic>F</italic><sub>1</sub>-score, and accuracy metrics, with human-annotated labels serving as the reference standard for the transformer-based model and a human adjudicator blinded to the labeling source for the FSL model reference standard.</p></sec><sec sec-type="results"><title>Results</title><p>The best-performing model obtained a microaveraged <italic>F</italic><sub>1</sub>-score of 0.88 (95% CI 0.86&#x2010;0.90) in extracting mortality information. The FSL-LLM approach demonstrated high accuracy in identifying primary CoD across various web-based sources. For GoFundMe, the FSL-LLM achieved 95.9% accuracy for primary cause identification compared to 97.9% for human annotators. In obituaries, FSL-LLM accuracy was 96.5% for primary causes, while human accuracy was 99%. For memorial websites, FSL-LLM achieved 98% accuracy for primary causes, with human accuracy at 99.5%.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>This study demonstrates the feasibility of using advanced NLP and LLM techniques to extract mortality data from publicly available web-based sources. These methods can significantly enhance the timeliness, completeness, and granularity of mortality surveillance, offering a valuable complement to traditional data systems. By enabling earlier detection of mortality signals and improving CoD classification across large populations, this approach may support more responsive public health monitoring and medical product safety assessments. Further work is needed to validate these findings in real-world health care settings and facilitate the integration of digital data sources into national public health surveillance systems.</p></sec></abstract><kwd-group><kwd>natural language processing</kwd><kwd>NLP</kwd><kwd>large language model</kwd><kwd>LLM</kwd><kwd>mortality data</kwd><kwd>few-shot learning</kwd><kwd>public health informatics</kwd><kwd>social media analysis</kwd><kwd>obituaries</kwd><kwd>automated surveillance</kwd><kwd>health care analytics</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Mortality is a critical variable in health care research, and all-cause mortality is one of the most studied end points [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref4">4</xref>]. Accurate identification of the fact, timing, and cause of death (CoD) is essential for various types of medical research, including clinical trials, observational studies, and postmarketing surveillance programs such as the US Food and Drug Administration (FDA) Sentinel System [<xref ref-type="bibr" rid="ref5">5</xref>-<xref ref-type="bibr" rid="ref8">8</xref>].</p><p>A recent report identified limitations in the availability of date and CoD information as a major cause for study insufficiency when considering the use of the Sentinel Active Risk Identification and Analysis system to address regulatory questions [<xref ref-type="bibr" rid="ref9">9</xref>]. Failing to identify deaths may result in substantial underestimation of mortality outcomes related to medical products, so efforts to identify additional data sources to supplement current systems have far-reaching consequences. Vital statistics data, collected in the United States through death certificates and submitted at the state level, serve as the &#x201C;reference standard&#x201D; for mortality information. Depending on US state laws (and sometimes the manner of death), death certificates may be completed by coroners, medical examiners, or physicians within the health care system. Once submitted to state systems, death certificate data are forwarded to the Centers for Disease Control and Prevention, which codes the underlying CoD and adds it to national records. However, this process is slow&#x2014;vital statistics data are typically delayed by at least 9 months, and the National Death Index often lags by up to 2 years. There are other data sources for death information, including claims databases and medical records, but each of these sources has limitations [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref11">11</xref>]. Claims databases may underrepresent uninsured populations, while medical records often lack standardization between health care providers, complicating data aggregation and comparison [<xref ref-type="bibr" rid="ref12">12</xref>]. In most claims databases, death-related information, including occurrence and CoD, is often incomplete or not directly recorded. Similarly, health care system&#x2013;based data sources, such as electronic health records (EHRs), frequently lack comprehensive mortality data, particularly when patients are not under the care of the health care system at the time of death. This poses significant challenges for researchers and clinicians relying on these data sources for epidemiological studies, outcomes research, and health care quality assessments.</p><p>The rise in the use of social media has introduced potential sources of mortality-related information, including web-based obituaries and the sharing of death information in social networks through Twitter (subsequently rebranded X) and other channels. There is growing precedent for the use of social media in public health and other health-related research, and user posts have been used to track illnesses [<xref ref-type="bibr" rid="ref13">13</xref>-<xref ref-type="bibr" rid="ref17">17</xref>], measure behavioral risk factors [<xref ref-type="bibr" rid="ref18">18</xref>-<xref ref-type="bibr" rid="ref22">22</xref>], localize diseases geographically [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>], and analyze symptoms and medication use [<xref ref-type="bibr" rid="ref25">25</xref>-<xref ref-type="bibr" rid="ref30">30</xref>]. Nonetheless, a key challenge inherent in social media data for mortality information is the capacity to extract the data and CoD at scale and with replicable methods. These social media sources offer potential advantages in timeliness, context, and coverage compared to traditional mortality data sources.</p><p>In this study, we sought to develop a set of NLP tools to extract both the fact and CoD from publicly available records and to assess the relative information density of illness and death information within these records. These types of data, when combined with other sources, could improve ascertainment in downstream studies that require the use of the facts and causes of mortality among EHR and claims data analyses.</p><p>The innovative approach leverages publicly available data to provide timely insights into population health trends, potentially enabling faster responses to emerging health threats. By linking social media and obituary data with patient records, the system could offer a more comprehensive view of health outcomes and risk factors as well as system evaluation.</p><p>This study highlights the transformative potential of LLMs in comparison to traditional NLP approaches. While earlier methods rely heavily on predefined rules or extensive labeled datasets, LLMs offer greater flexibility through few-shot learning (FSL) and contextual understanding of complex narratives. This capability is especially critical for extracting nuanced mortality information from diverse and informal web-based text, where structure and terminology often vary widely across sources.</p><p>In this study, we developed and evaluated a pipeline combining transformer-based NLP models and FSL with LLMs to extract mortality information, including fact and CoD, from publicly available web-based sources. Our goal was to assess the feasibility, accuracy, and utility of this approach for supplementing traditional mortality data in health care research and surveillance.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Overview</title><p>We developed and evaluated natural language processing (NLP) techniques to extract mortality information from publicly available web-based sources, focusing on US-related data. The research methodology included data collection, NLP model development, and performance assessment.</p></sec><sec id="s2-2"><title>Data Sources and Study Cohort</title><p>Data were collected from X (formerly known as Twitter), GoFundMe, web-based obituaries (Obituaries), and memorial websites (EverLoved and TributeArchive) between the years 2015 and 2022 in the United States, which are publicly available and aggregated for research purposes in accordance with fair use. The web-based obituary sources provide more robust metadata for determining inclusion criteria than records obtained from Twitter or GoFundMe. Our collection methods, therefore, differed by source.</p><p>Our search on X used around 50 derived keywords (the list is in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>) for English-language posts while excluding non-English content. Keywords included terms like &#x201C;death,&#x201D; &#x201C;expired,&#x201D; and &#x201C;deceased.&#x201D; Using Twitter&#x2019;s official research application programming interface, this approach yielded approximately 40 million tweets. Using similar keywords (provided in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>), we identified and retrieved posts from GoFundMe and memorial websites (EverLoved and TributeArchive) containing mortality-related information. For obituaries, we acquired reports from 2015 to 2022, which contained millions of records. For the obituary data sources, we collected structured metadata (eg, first name, last name, date of death, date of birth, and location) and extracted accompanying textual information. NLP techniques were subsequently used on this textual content to supplement or complete missing or incomplete metadata fields. This approach allowed us to maximize the information extracted from each obituary, enhancing the overall quality and completeness of our dataset.</p></sec><sec id="s2-3"><title>Reference Standard</title><p>To construct a human-based reference dataset for training and testing our models, we developed an annotation process that captured the deceased&#x2019;s name, names of related individuals, key dates (including death, birth, and other relevant dates), and CoD. First, annotators were instructed to accurately classify names with postnominals, avoid names in Twitter handles, and use specific relationship attributes for related persons (eg, spouse, sibling, and child). Second, annotated dates included exact, partial, or relative expressions, with clear distinctions for death and birth dates. Third, the CoDs were annotated with attributes indicating assertion (positive, negative, and uncertain) and patient versus nonpatient (reference to the deceased or to someone else). Finally, if no relevant data were found in a document, annotators classified the document as &#x201C;No data.&#x201D;</p><p>A corpus of 4200 notes, 1050 from each of the data sources, was randomly sampled. We split the 4200 annotated posts from all data sources into training (70%), testing (20%), and validation (10%) datasets. The training data contained 81,082 tokens (words), and the test data contained 27,834 tokens (words).</p></sec><sec id="s2-4"><title>Annotation</title><p>The data were annotated by 3 trained nurse annotators who closely followed a detailed annotation guideline, categorizing each post into first and last names, dates of birth, dates of death, and CoD. The training was initiated using records from Twitter, GoFundMe, the memorial website (EverLoved or TributeArchive), and Obituaries, with all 3 annotators independently labeling the same documents in rounds of 15 documents from each source (n=45).</p><p>After each training round of annotation was completed by all 3 members, agreement rates were computed between pairs of annotation sets. The overall interannotator agreement (IAA) was evaluated using Cohen &#x03BA; [<xref ref-type="bibr" rid="ref31">31</xref>], and annotators were required to achieve an overall IAA threshold of 0.80 on the training set before proceeding with the full annotation process. When the targeted threshold was not met, the annotation team performed a consensus annotation over each document in a given annotation round, discussed their differences, and updated or clarified the annotation guidelines. Once trained, each annotator independently labeled a subset of a corpus totaling 4200 documents (1050 per source). To assess reliability, 100 additional documents (25 per source) were randomly assigned to all 3 annotators, and an independent IAA was conducted. The eHOST annotation tool was used to annotate the documents [<xref ref-type="bibr" rid="ref32">32</xref>].</p></sec><sec id="s2-5"><title>Information Density Assessment</title><p>Annotations completed by nurse annotators were used to assess the information density of web-based sources, such as social media platforms like Twitter, to determine if they contained sufficient details for reliable patient linkage and augmentation of date of death in health care systems. Sources with inadequate information were excluded from further analysis. Assessment of CoD availability was completed using the 600 document annotations used in the FSL validation with verification by the nurse adjudicator of CoDs mentioned within the post.</p></sec><sec id="s2-6"><title>NLP Development and Implementation</title><p>We developed in parallel 2 NLP tools for information extraction from the previously described social media sources. First, we adapted 4 deep learning transformer-based methods including Bidirectional Encoder Representations from Transformers (BERT) [<xref ref-type="bibr" rid="ref33">33</xref>], Robustly Optimized BERT Pretraining Approach (RoBERTa) [<xref ref-type="bibr" rid="ref34">34</xref>], A Lite BERT (ALBERT) [<xref ref-type="bibr" rid="ref35">35</xref>], and BERTweet [<xref ref-type="bibr" rid="ref36">36</xref>] to extract the decedent&#x2019;s name, date of birth, and date of death and to exclude any irrelevant dates. The technical pipeline overview for the transformer-based model is illustrated in <xref ref-type="fig" rid="figure1">Figure 1</xref>.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Workflow of the natural language processing pipeline development and evaluation process.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v27i1e71113_fig01.png"/></fig><p>To identify CoD, we used an FSL approach to leverage an open-source large language model (LLM; <xref ref-type="fig" rid="figure2">Figure 2</xref>). The decision to forgo transformer models for this phase of information extraction was based on the need for a nuanced understanding of both the extracted cause and its contextual relevance in predicting CoD. Instead, we used an iterative prompting strategy incorporating annotated examples and structured guidelines to delineate primary and secondary CoD. High-quality annotation labels, determined by consensus between at least 2 annotators, ensured the reliability of the prompts.</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Workflow for few-shot learning and evaluation. LLM: large language model.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v27i1e71113_fig02.png"/></fig><p>For example, in the post, &#x201C;Jane Smith died from a severe infection following surgery. She also had diabetes and hypertension, which contributed to her deteriorating health,&#x201D; the main cause would be noted as &#x201C;severe infection following surgery,&#x201D; and the secondary causes as &#x201C;diabetes&#x201D; and &#x201C;hypertension.&#x201D; The initial prompt engineering stage ensures that the LLM properly formulates the type of information to extract or predict. We used the LLaMA model, a 13 GB language model developed by Facebook AI Research, for processing the data [<xref ref-type="bibr" rid="ref37">37</xref>]. LLaMA, which stands for &#x201C;Large Language Model Meta AI,&#x201D; is a foundational language model that exhibits remarkable performance across various NLP tasks [<xref ref-type="bibr" rid="ref37">37</xref>]. A smaller version, such as the 13 GB variant, of the LLaMA model can be run locally on a machine with sufficient computational resources, making it more accessible and efficient for certain applications. We started with 30 randomly selected examples from the manually annotated data (training split) for prompting (the LLM-prompt example is available in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>) and 30 for assessing the model&#x2019;s performance, where at least 2 annotators agreed on the annotated instance. The prompts and assessment examples went through several iterations of LLM refinement, totaling 4 iterations, until the identified CoD was correct in most cases across the various assessment sets. The accuracy during the prompting process was evaluated qualitatively to understand where the model performed correctly and where it made errors.</p><p>During the testing phase, we evaluated our final prompting design on a new set of 600 examples. The evaluation process involved 3 steps:</p><list list-type="bullet"><list-item><p>A nurse annotator identified the CoD in these examples following the provided guidelines.</p></list-item><list-item><p>Simultaneously, our refined language model (LLM) automatically extracted the CoD from the same 600 examples.</p></list-item><list-item><p>A second trained nurse, acting as an adjudicator, independently reviewed both sets of results. This review ensured that the annotations adhered to the guidelines and that the primary CoD was accurately identified in each case.</p></list-item></list><p>Following the evaluation, we analyzed the results by determining the accuracy of primary CoD and additional identified causes from both the human annotator and the LLM per the adjudication. We then determined true positives, true negatives, false positives, and false negatives to compute relevant statistical metrics, allowing us to assess the accuracy and effectiveness of both human and automated CoD identification methods.</p></sec><sec id="s2-7"><title>Statistical Metrics for Model Evaluation</title><p>For the transformer-based model evaluation, we calculated sensitivity, positive predictive value, and the <italic>F</italic><sub>1</sub>-score to evaluate model performance, and we computed microaverages for each to compute the average metric for a global measure of performance (all metric definitions are provided in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). We used bootstrap to calculate the CI by resampling the test set, calculating the required metrics for each resample, and using percentiles of these metrics to form the CI. We also assessed the information density of web-based posts from each data source to determine their adequacy for reliable patient linkage and mortality information augmentation in health care systems.</p><p>For the LLM CoD information extraction module, we calculated the <italic>F</italic><sub>1</sub>-score, accuracy, precision, and recall for the primary CoD. However, for all potential CoD, due to the variation in the number of causes and the challenge of measuring performance using traditional NLP metrics, we asked the adjudicator to qualitatively assess the number of cases where the LLM correctly identified all the contributing CoD mentioned in the posts and to determine if the LLM and human annotators correctly identified the primary CoD. As such, we addressed the ambiguity of using a static output for each social media post. The adjudicator focused on whether the predicted CoD was accurate, regardless of whether it was explicitly mentioned in the post or inferred from the overall understanding of the post.</p><p>Phrases classified as &#x201C;No CoD&#x201D; indicated no specific medical CoD. These included &#x201C;brief or sudden or extended or chronic illness,&#x201D; &#x201C;unexpected&#x201D; or &#x201C;sudden death or passing,&#x201D; &#x201C;natural causes,&#x201D; &#x201C;no mention&#x201D; of cause, &#x201C;none,&#x201D; and &#x201C;unknown or unspecified reasons or cause.&#x201D; Posts containing only such phrases were categorized as &#x201C;No CoD.&#x201D; Correct identification of these cases by the language model counted as true negatives in the CoD identification process. This approach ensured that vague or nonmedical descriptions were not misclassified as specific CoDs.</p></sec><sec id="s2-8"><title>Application of NLP and Final Data Collection</title><p>The final phase of our study involved compiling the extracted data into a comprehensive dataset ready for analysis. We applied a series of cleaning filters and NLP techniques to ensure that only documents with reliable mortality-related information were included. This thorough process resulted in a dataset. This dataset, enriched with mortality information from various sources, is poised to serve as a valuable resource for public health surveillance and future research efforts.</p></sec><sec id="s2-9"><title>Ethical Considerations</title><p>Given its focus on public health surveillance using open-source information, this research qualifies for exemption from FDA and Vanderbilt University Medical Center Institutional Review Board oversight. This study used publicly available web-based data and did not involve any interaction with human participants. Data collection and analysis were conducted in accordance with ethical guidelines and fair use principles for research purposes.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Annotation IAA</title><p>Overall IAA with respect to GoFundMe achieved a 92.5% agreement rate in the final iteration, while the IAA within Twitter data maintained an 85.7% agreement rate after 3 rounds of assessment. IAA achieved within data sourced from the obituary websites demonstrated strong overall agreement, with a 91.5% agreement rate after the third round of assessment.</p></sec><sec id="s3-2"><title>Information Density in Social Media</title><p>Analysis of information density in web-based posts revealed varying levels of utility for patient linkage and mortality information augmentation in health care systems. Among the examined sources, 3 demonstrated high information density for annotated names, ranging from 87.81% to 97.81% (<xref ref-type="table" rid="table1">Table 1</xref>). These sources provided sufficient detail for reliable patient identification and mortality data enhancement, whereas X had low information density for patient identification and was excluded from subsequent analysis.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Information density of annotated names across different web-based public sources.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Source type</td><td align="left" valign="bottom">Names annotated, n (%)</td></tr></thead><tbody><tr><td align="left" valign="top">Twitter</td><td align="left" valign="top">13.71</td></tr><tr><td align="left" valign="top">Obituary</td><td align="left" valign="top">96.48</td></tr><tr><td align="left" valign="top">GoFundMe</td><td align="left" valign="top">87.81</td></tr><tr><td align="left" valign="top">Memorial Website</td><td align="left" valign="top">97.81</td></tr></tbody></table></table-wrap></sec><sec id="s3-3"><title>Extracting Mortality Information Results</title><p>Evaluated on the manually annotated test data, the RoBERTa model achieved the highest overall performance for extracting the targeted information, with a microaveraged <italic>F</italic><sub>1</sub>-score of 0.88 (95% CI 0.86&#x2010;0.90; <xref ref-type="table" rid="table2">Table 2</xref>). Confusion matrices are provided in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. This model outperformed others in all 3 tasks, achieving an <italic>F</italic><sub>1</sub>-score of 0.85 (95% CI 0.84&#x2010;0.86) for decedent name, 0.89 (95% CI 0.88&#x2010;0.90) for date of death, and 0.94 (95% CI 0.92&#x2010;0.94) for date of birth. The ALBERT model attained an <italic>F</italic><sub>1</sub>-score of 0.87 (95% CI 0.86&#x2010;0.89) for date of death, 0.83 (95% CI 0.82&#x2010;0.86) for decedent name, and 0.91 (95% CI 0.90&#x2010;0.93) for date of birth. BERTweet achieved an <italic>F</italic><sub>1</sub>-score of 0.90 (95% CI 0.89&#x2010;0.91) for date of birth, 0.82 (95% CI 0.81&#x2010;0.83) for decedent name, and 0.85 (95% CI 0.84&#x2010;0.86) for date of death. BERT&#x2019;s performance was marginally lower, with <italic>F</italic><sub>1</sub>-scores of 0.81 (95% CI 0.80&#x2010;0.83), 0.84 (95% CI 0.82&#x2010;0.86), and 0.89 (95% CI 0.88&#x2010;0.90) for decedent name, date of death, and date of birth, respectively.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Performance comparison of fine-tuned transformer models (on named entity recognition tasks: decedent name, date of death, and date of birth).</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom"/><td align="left" valign="bottom" colspan="3">RoBERTa<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup></td><td align="left" valign="bottom" colspan="3">BERT<sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup></td><td align="left" valign="bottom" colspan="3">ALBERT<sup><xref ref-type="table-fn" rid="table2fn3">c</xref></sup></td><td align="left" valign="bottom" colspan="3">BERTweet</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Precision (PPV<sup><xref ref-type="table-fn" rid="table2fn4">d</xref></sup>)</td><td align="left" valign="top">Recall (sensitivity)</td><td align="left" valign="top"><italic>F</italic><sub>1</sub>-score (95% CI)</td><td align="left" valign="top">Precision (PPV)</td><td align="left" valign="top">Recall (sensitivity)</td><td align="left" valign="top"><italic>F</italic><sub>1</sub>-score (95% CI)</td><td align="left" valign="top">Precision (PPV)</td><td align="left" valign="top">Recall (sensitivity)</td><td align="left" valign="top"><italic>F</italic><sub>1</sub>-score (95% CI)</td><td align="left" valign="top">Precision (PPV)</td><td align="left" valign="top">Recall (sensitivity)</td><td align="left" valign="top"><italic>F</italic><sub>1</sub>-score (95% CI)</td></tr></thead><tbody><tr><td align="left" valign="top">Decedent name</td><td align="left" valign="top">0.86</td><td align="left" valign="top">0.84</td><td align="left" valign="top">0.85<break/>(0.84&#x2010;0.86)</td><td align="left" valign="top">0.81</td><td align="left" valign="top">0.80</td><td align="left" valign="top">0.81<break/>(0.80&#x2010;0.83)</td><td align="left" valign="top">0.84</td><td align="left" valign="top">0.82</td><td align="left" valign="top">0.83<break/>(0.82&#x2010;0.86)</td><td align="left" valign="top">0.83</td><td align="left" valign="top">0.81</td><td align="left" valign="top">0.82<break/>(0.81&#x2010;0.83)</td></tr><tr><td align="left" valign="top">Date of death</td><td align="left" valign="top">0.87</td><td align="left" valign="top">0.91</td><td align="left" valign="top">0.89<break/>(0.88&#x2010;0.90)</td><td align="left" valign="top">0.82</td><td align="left" valign="top">0.87</td><td align="left" valign="top">00.84<break/>(0.82&#x2010;0.86)</td><td align="left" valign="top">0.86</td><td align="left" valign="top">0.88</td><td align="left" valign="top">0.87<break/>(0.86&#x2010;0.89)</td><td align="left" valign="top">0.86</td><td align="left" valign="top">0.84</td><td align="left" valign="top">0.85<break/>(0.84&#x2010;0.86)</td></tr><tr><td align="left" valign="top">Date of birth</td><td align="left" valign="top">0.95</td><td align="left" valign="top">0.93</td><td align="left" valign="top">0.94<break/>(0.92&#x2010;0.94)</td><td align="left" valign="top">0.90</td><td align="left" valign="top">0.89</td><td align="left" valign="top">0.89<break/>(0.88&#x2010;0.90)</td><td align="left" valign="top">0.92</td><td align="left" valign="top">0.91</td><td align="left" valign="top">0.91<break/>(0.90&#x2010;0.93)</td><td align="left" valign="top">0.91</td><td align="left" valign="top">0.89</td><td align="left" valign="top">0.90<break/>(0.89&#x2010;0.91)</td></tr><tr><td align="left" valign="top">Microaverage</td><td align="left" valign="top">0.88</td><td align="left" valign="top">0.88</td><td align="left" valign="top">0.88<break/>(0.86&#x2010;0.90)</td><td align="left" valign="top">0.83</td><td align="left" valign="top">0.85</td><td align="left" valign="top">0.84<break/>(0.82&#x2010;0.86)</td><td align="left" valign="top">0.85</td><td align="left" valign="top">0.87</td><td align="left" valign="top">0.86<break/>(0.84&#x2010;0.86)</td><td align="left" valign="top">0.84</td><td align="left" valign="top">0.85</td><td align="left" valign="top">0.84<break/>(0.82&#x2010;0.86)</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>ROBERTa: Robustly Optimized BERT Pretraining Approach.</p></fn><fn id="table2fn2"><p><sup>b</sup>BERT: Bidirectional Encoder Representations from Transformers.</p></fn><fn id="table2fn3"><p><sup>c</sup>ALBERT: A Lite BERT.</p></fn><fn id="table2fn4"><p><sup>d</sup>PPV: positive predictive value.</p></fn></table-wrap-foot></table-wrap><p>The accuracy of the primary CoD identification and all CoD identification for both FSL-LLM and human identification is as follows: for GoFundMe, FSL-LLM achieved an accuracy of 95.9% for primary cause and 56.4% for all causes, while human accuracy was 97.9% for primary cause and 93.3% for all causes. For Obituary, FSL-LLM accuracy was 96.5% for primary and 96% for all causes, with human accuracy at 99% for primary causes and 98.5% for all causes. For memorial websites, FSL-LLM accuracy was 98% for primary causes and 93.5% for all causes, whereas human accuracy was 99.5% for primary causes and 99% for all causes (<xref ref-type="table" rid="table3">Table 3</xref>).</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Accuracy of cause of death (CoD) identification (few-shot learning [FSL]-large language model [LLM] vs human).</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Source</td><td align="left" valign="bottom">FSL-LLM: primary CoD identification accuracy (%)</td><td align="left" valign="bottom">Human: primary CoD identification accuracy (%)</td><td align="left" valign="bottom">LLM: all CoD identification accuracy (%)</td><td align="left" valign="bottom">Human: all CoD identification accuracy (%)</td></tr></thead><tbody><tr><td align="left" valign="top">GoFundMe</td><td align="char" char="." valign="top">95.9</td><td align="char" char="." valign="top">97.9</td><td align="char" char="." valign="top">56.4</td><td align="char" char="." valign="top">93.3</td></tr><tr><td align="left" valign="top">Obituary</td><td align="char" char="." valign="top">96.5</td><td align="char" char="." valign="top">99</td><td align="char" char="." valign="top">96</td><td align="char" char="." valign="top">98.5</td></tr><tr><td align="left" valign="top">Memorial websites</td><td align="char" char="." valign="top">98</td><td align="char" char="." valign="top">99.5</td><td align="char" char="." valign="top">93.5</td><td align="char" char="." valign="top">99</td></tr></tbody></table></table-wrap><p>The precision, recall, and <italic>F</italic><sub>1</sub>-score for the LLM&#x2019;s versus human detection of the primary CoD were computed for each source. The metrics are presented in <xref ref-type="table" rid="table4">Table 4</xref>.</p><table-wrap id="t4" position="float"><label>Table 4.</label><caption><p>Precision, recall, and <italic>F</italic><sub>1</sub>-score for few-shot learning (FSL)-large language model (LLM) versus human (primary cause of death).</p></caption><table id="table4" frame="hsides" rules="groups"><thead><tr><td align="left" valign="top">Sources</td><td align="left" valign="top" colspan="3">FSL-LLM</td><td align="left" valign="top" colspan="3">Human</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Precision</td><td align="left" valign="top">Recall</td><td align="left" valign="top"><italic>F</italic><sub>1</sub>-score</td><td align="left" valign="top">Precision</td><td align="left" valign="top">Recall</td><td align="left" valign="top"><italic>F</italic><sub>1</sub>-score</td></tr></thead><tbody><tr><td align="left" valign="top">GoFundMe</td><td align="char" char="." valign="top">0.97</td><td align="char" char="." valign="top">0.95</td><td align="char" char="." valign="top">0.96</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">0.98</td><td align="char" char="." valign="top">0.99</td></tr><tr><td align="left" valign="top">Obituary</td><td align="char" char="." valign="top">0.61</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">0.76</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">0.82</td><td align="char" char="." valign="top">0.90</td></tr><tr><td align="left" valign="top">Memorial websites</td><td align="char" char="." valign="top">0.94</td><td align="char" char="." valign="top">0.98</td><td align="char" char="." valign="top">0.96</td><td align="char" char="." valign="top">1.00</td><td align="char" char="." valign="top">0.98</td><td align="char" char="." valign="top">0.99</td></tr></tbody></table></table-wrap></sec><sec id="s3-4"><title>Assessment of CoD Availability and Classification Error Analysis Across Social Media Sources</title><p>As shown in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>, social media sources varied significantly in the availability of CoD information. Obituaries had a very low density of CoD mentions, with only 6% (n=63) of 1,050 annotated posts containing any CoD. EverLoved posts primarily contained a single potential CoD, with 89% (n=934) of 1,050 posts including one cause. GoFundMe was the richest source, with 43% (n=451) of 1,050 posts containing a single CoD and 50% (n=525) containing multiple potential CoD mentions. However, not all mentioned CoDs or conditions pertained to the deceased individual referenced in the social media post.</p><p>The distribution and comparison of errors made by LLM and human annotators across the test dataset are illustrated in <xref ref-type="fig" rid="figure3">Figure 3</xref>. Each post may have multiple errors or error types. The analysis focuses on discrepancies in both primary and additional CoD annotations, providing a detailed breakdown of error types and frequencies. The errors include missed additional patient conditions, missed nonpatient conditions, missed primary causes, incorrect CoD annotated, ineligible notes annotated, nonpatient conditions attributed to the patient, and unclear annotation of no CoD.</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Types of errors between LLM versus human annotation on the test dataset (errors per post). CoD: cause of death; FSL: few-shot learning; LLM: large language model.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v27i1e71113_fig03.png"/></fig><p>The disparate information density across the data sources (<xref ref-type="fig" rid="figure3">Figure 3</xref>) influenced the types of errors found within the annotations, though the human annotator consistently had higher rates of agreement with the adjudicator than the computer annotations. Obituaries had a low density of CoD information and very low error rates. The most common error made by the FSL algorithm was in the annotation of a CoD that was not mentioned in the post (3.5%), whereas the human annotator missed a mentioned CoD in 1% of posts. For memorial websites, both human and FSL-LLM annotations exhibited a small number of errors. FSL-LLM annotations missed mentions of medical conditions in 4.5% of posts and attributed primary causes incorrectly in only 2% of posts, whereas human annotators had an error rate of less than 1% for any category. For GoFundMe, which regularly mentions multiple patient and nonpatient conditions, the FSL-LLM model has similar error rates to human annotation except for &#x201C;missed nonpatient condition&#x201D; (10.5%) and &#x201C;missed additional patient conditions&#x201D; (31.5%) categories, indicating a performance gap compared to human annotations (1.5% and 3%, respectively) in identification of all potential medical conditions within the post though very low error rate in identification of the primary CoD.</p></sec><sec id="s3-5"><title>Final Collected Records</title><p>After applying the cleaning filters and NLP techniques, we successfully identified and extracted mortality-related information from a substantial number of documents across various sources. <xref ref-type="table" rid="table5">Table 5</xref> provides a summary of the total documents retained from each source.</p><table-wrap id="t5" position="float"><label>Table 5.</label><caption><p>Number of documents with mortality-related information identified from each source.</p></caption><table id="table5" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Source</td><td align="left" valign="bottom">Total documents, n</td></tr></thead><tbody><tr><td align="left" valign="top">GoFundMe</td><td align="left" valign="top">23,615</td></tr><tr><td align="left" valign="top">Memorial website (TributeArchive and EverLoved)</td><td align="left" valign="top">733,754</td></tr><tr><td align="left" valign="top">Obituaries</td><td align="left" valign="top">7,375,229</td></tr><tr><td align="left" valign="top">Total</td><td align="left" valign="top">8,132,598</td></tr></tbody></table></table-wrap></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>We used a novel approach to extract mortality data from web-based sources using transformer-based NLP models and FSL with LLMs. Our analysis demonstrated the effectiveness of fine-tuned transformer-based NLP models in extracting mortality data from diverse web-based sources, showcasing their potential to enhance traditional data collection methods. We also developed an FSL approach with LLMs to effectively identify primary CoD from web-based unstructured text data, achieving high agreement with human annotators. By leveraging publicly available web-based data, our approach has the potential to supplement conventional mortality databases, facilitating a more timely, comprehensive, and granular understanding of population-level mortality trends and risk factors.</p><p>Our study is consistent with other published papers that use social media data generally and obituary data specifically to improve the ability of health and health care research to accurately measure outcomes at the population level. For example, some studies have successfully used data from the Twitter platform to predict opioid overdose [<xref ref-type="bibr" rid="ref38">38</xref>] and heart disease mortality [<xref ref-type="bibr" rid="ref39">39</xref>], outperforming traditional demographic and health risk factors in predicting mortality. Additional studies have used GoFundMe data to identify disease categories in 89,645 medical crowdfunding campaigns [<xref ref-type="bibr" rid="ref40">40</xref>] and to identify factors associated with cancer fundraising success [<xref ref-type="bibr" rid="ref41">41</xref>]. An additional set of studies has used a range of techniques in web-based obituaries specifically, including automated surveillance of cancer mortality trends [<xref ref-type="bibr" rid="ref42">42</xref>], extraction of kinship data for genetic research [<xref ref-type="bibr" rid="ref43">43</xref>], and reporting of drug overdose [<xref ref-type="bibr" rid="ref44">44</xref>].</p><p>Our study extends the existing literature by using transformer-based NLP models, which enhanced the extraction of key components of mortality data across public sources. Models such as RoBERTa, ALBERT, BERTweet, and BERT showed strong performance in handling unstructured data to extract decedent names (first and last), dates of birth, and dates of death, with RoBERTa achieving the highest microaveraged <italic>F</italic><sub>1</sub>-score of 0.88 (95% CI 0.86&#x2010;0.90).</p><p>For primary CoD identification, our FSL-LLM approach demonstrated high accuracy across all sources (GoFundMe: 95.9%, obituaries: 96.5%, memorial websites: 98%), approximating human annotator performance (97.9%, 99%, and 99.5% respectively). Detailed performance metrics revealed robust results for GoFundMe (precision=0.97; recall=0.95; <italic>F</italic><sub>1</sub>=0.96) and memorial websites (precision=0.94; recall=0.98; <italic>F</italic><sub>1</sub>=0.96). Obituaries achieved high accuracy, though the precision-recall pattern (precision=0.61; recall=1.0; <italic>F</italic><sub>1</sub>=0.76) suggests potential for optimization in processing such data format. These findings demonstrate the model&#x2019;s effectiveness while highlighting opportunities for source-specific improvements.</p><p>FSL-LLM demonstrated equivalent performance to human annotations for CoD identification across all sources; there remains room for further enhancement to identify potential contributing CoDs. The error analysis indicates that FSL-LLM exhibited higher error in categories such as &#x201C;missed nonpatient condition&#x201D; and &#x201C;missed additional patient condition,&#x201D; whereas it exhibited very low rates of error in identifying primary CoD or appropriately classifying a note as having no specific CoD noted. This was primarily noted in GoFundMe data, as it was the only data source with significant posts containing more than 1 medical condition. Targeted improvements in the model&#x2019;s ability to identify nonpatient conditions and additional potential contributing causes are necessary to reduce these errors. The observed variation in error rates underscores the need for data-specific tuning to optimize model accuracy across different sources. To further enhance the FSL-LLM&#x2019;s performance, focused fine-tuning on the identified error types and the integration of more diverse training datasets are recommended.</p><p>An additional finding was the low information density observed in the data from the X platform relative to the other data sources allowing linkage to specific persons. The absence of reliable person identification in the data hinders reliable patient linkage, an essential element in the augmentation of mortality information and subsequent integration into the health care system. We therefore excluded Twitter data from the analysis after the annotation phase.</p><p>Automated extraction of key mortality information from web-based sources has the potential to significantly improve traditional mortality databases, which often experience delays and incomplete data. This approach enables the timely collection of crucial details surrounding mortality, such as decedent names, dates of birth, and dates of death, which could enable linkage to other health care data sources such as EHRs to facilitate clinical research. For instance, in studies monitoring medical product safety and effectiveness using insurance claims and EHR data, such as in the FDA Sentinel system, mortality information from publicly available sources using approaches described here could allow investigators to study inferential questions regarding the impact of medical products on overall and cause-specific mortality. Integrating these methods with health care systems can improve reporting timeliness and completeness [<xref ref-type="bibr" rid="ref45">45</xref>].</p></sec><sec id="s4-2"><title>Limitations</title><p>Despite promising results, this study has several limitations. First, social media data may not fully represent all population segments due to use and sharing biases. Second, although the NLP pipeline achieved high accuracy, the inherent ambiguity and scarcity of specific CoD mentions in the source data resulted in the underdetermination of some portions of the targeted information, as indicated by the human reference standard reviewers. Consequently, the NLP system may still misclassify some data points. Additionally, our reliance on keyword-based searches may miss relevant posts because of variations in language, slang, or indirect references to mortality, and the exclusion of non-English posts may limit generalizability. Moreover, social media posts may underreport stigmatized conditions such as HIV, suicide, or opioid-related deaths due to reporting bias, and the exclusion of nonusers may further affect data representativeness. Finally, CoD identification from text remains challenging, often requiring an understanding of context and relationships between mentioned conditions. While the FSL with the LLM algorithm performed well in identifying primary CoD, further work is needed to improve its ability to extract multiple contributing causes from individual posts. The use of a nurse adjudicator may also introduce correlated errors with the human-based reference, potentially providing a conservative estimate of model performance.</p></sec><sec id="s4-3"><title>Future Directions</title><p>At the population level, future research could focus on comparing CoD derived from web-based public data with those reported by official agencies. This comparison could help validate the accuracy and timeliness of web-based sourced mortality information. If validated, such data could potentially provide near real-time insights into emerging mortality trends, particularly for rapidly spreading causes such as infectious diseases or environmental exposures.</p><p>The integration of web-based sourced mortality data into existing surveillance systems would require careful validation against official records to ensure accuracy and reliability. This process would likely involve collaboration between researchers and public health agencies. Such collaborations could help develop protocols for effectively incorporating web-based data into public health surveillance and decision-making processes, potentially enhancing the speed and breadth of public health responses. Future research also should assess the plausibility of the CoD distribution from web-based sources by comparing it to sex- and age-adjusted national mortality statistics and investigating the potential underreporting of specific causes.</p></sec><sec id="s4-4"><title>Conclusions</title><p>We have demonstrated a promising application of advanced NLP techniques, including transformer-based models and FSL with LLMs, to extract critical mortality information and identify CoDs from diverse web-based public data sources. The successful development of an NLP pipeline and the strong performance of the FSL algorithm highlight the potential of these approaches to address limitations in traditional mortality databases and improve the timeliness, comprehensiveness, and granularity of mortality monitoring. However, the study acknowledges several limitations, such as potential biases in web-based data representation and challenges in extracting multiple contributing CoDs. Future research should focus on validating the usefulness of these methods in real-world settings, studying the correlation between digital-derived CoDs and official records, and improving the integration of web-based data into public health surveillance systems. Addressing these challenges and opportunities will strengthen the application of advanced NLP techniques to web-based public data for enhancing mortality surveillance.</p></sec></sec></body><back><ack><p>This project was supported by Task Order 75F40123F19010 under Master Agreement 75F40119D10037 from the US Food and Drug Administration (FDA). FDA coauthors reviewed the study protocol, statistical analysis plan, and the manuscript for scientific accuracy and clarity of presentation. Representatives of the FDA reviewed a draft of the manuscript for the presence of confidential information and accuracy regarding the statement of any FDA policy. The views expressed are those of the authors and not necessarily those of the US FDA.</p></ack><notes><sec><title>Data Availability</title><p>The datasets generated and analyzed during this study are not publicly available due to the inclusion of sensitive health information and participant confidentiality constraints but are available from the corresponding author upon reasonable request. The code used for analysis is available at reference [<xref ref-type="bibr" rid="ref46">46</xref>].</p></sec></notes><fn-group><fn fn-type="con"><p>MA-G, RR, MEM, RJD, and JJH-M conceptualized the study. MA-G, ML-N, RJD, and MEM developed the methodology. MA-G, DW, ML-N, MEM, and MSK developed the software. JAD, JMW, ML-N, RR, and MFM performed validation. MA-G, XW, and AK conducted the formal analysis. MA-G, ML-N, and JMW led the investigation. MEM, MM, and RJD provided key resources. MFM, JAD, JMW, ML-N, and RR curated the data. MA-G, RJD, MEM, ML-N, and RR drafted the manuscript. RR, RJD, MM, JJH-M, XW, and AK reviewed and edited the manuscript. MA-G, DW, and ML-N created the visualizations. RR, MEM, RJD, and JJH-M supervised the study. ML-N led project administration. MEM, RJD, JJH-M, XW, and AK acquired funding. All authors had full access to the code, contributed to the manuscript, and approved the final version for submission.</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">ALBERT</term><def><p>A Lite BERT</p></def></def-item><def-item><term id="abb2">BERT</term><def><p>Bidirectional Encoder Representations From Transformers</p></def></def-item><def-item><term id="abb3">CoD</term><def><p>cause of death</p></def></def-item><def-item><term id="abb4">EHR</term><def><p>electronic health record</p></def></def-item><def-item><term id="abb5">FDA</term><def><p>Food and Drug Administration</p></def></def-item><def-item><term id="abb6">FSL</term><def><p>few-shot learning</p></def></def-item><def-item><term id="abb7">IAA</term><def><p>interannotator agreement</p></def></def-item><def-item><term id="abb8">LLM</term><def><p>large language model</p></def></def-item><def-item><term id="abb9">NLP</term><def><p>natural language processing</p></def></def-item><def-item><term id="abb10">RoBERTa</term><def><p>Robustly Optimized BERT Pretraining Approach</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Weiss</surname><given-names>NS</given-names> </name></person-group><article-title>All-cause mortality as an outcome in epidemiologic studies: proceed with caution</article-title><source>Eur J Epidemiol</source><year>2014</year><month>03</month><volume>29</volume><issue>3</issue><fpage>147</fpage><lpage>149</lpage><pub-id pub-id-type="doi">10.1007/s10654-014-9899-y</pub-id><pub-id pub-id-type="medline">24729152</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Flegal</surname><given-names>KM</given-names> </name><name name-style="western"><surname>Kit</surname><given-names>BK</given-names> </name><name name-style="western"><surname>Orpana</surname><given-names>H</given-names> </name><name name-style="western"><surname>Graubard</surname><given-names>BI</given-names> </name></person-group><article-title>Association of all-cause mortality with overweight and obesity using standard body mass index categories: a systematic review and meta-analysis</article-title><source>JAMA</source><year>2013</year><month>01</month><day>2</day><volume>309</volume><issue>1</issue><fpage>71</fpage><lpage>82</lpage><pub-id pub-id-type="doi">10.1001/jama.2012.113905</pub-id><pub-id pub-id-type="medline">23280227</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Berrington de Gonzalez</surname><given-names>A</given-names> </name><name name-style="western"><surname>Hartge</surname><given-names>P</given-names> </name><name name-style="western"><surname>Cerhan</surname><given-names>JR</given-names> </name><etal/></person-group><article-title>Body-mass index and mortality among 1.46 million White adults</article-title><source>N Engl J Med</source><year>2010</year><month>12</month><day>2</day><volume>363</volume><issue>23</issue><fpage>2211</fpage><lpage>2219</lpage><pub-id pub-id-type="doi">10.1056/NEJMoa1000367</pub-id><pub-id pub-id-type="medline">21121834</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Starfield</surname><given-names>B</given-names> </name></person-group><article-title>Is US health really the best in the world?</article-title><source>JAMA</source><year>2000</year><month>07</month><day>26</day><volume>284</volume><issue>4</issue><fpage>483</fpage><lpage>485</lpage><pub-id pub-id-type="doi">10.1001/jama.284.4.483</pub-id><pub-id pub-id-type="medline">10904513</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mieno</surname><given-names>MN</given-names> </name><name name-style="western"><surname>Tanaka</surname><given-names>N</given-names> </name><name name-style="western"><surname>Arai</surname><given-names>T</given-names> </name><etal/></person-group><article-title>Accuracy of death certificates and assessment of factors for misclassification of underlying cause of death</article-title><source>J Epidemiol</source><year>2016</year><volume>26</volume><issue>4</issue><fpage>191</fpage><lpage>198</lpage><pub-id pub-id-type="doi">10.2188/jea.JE20150010</pub-id><pub-id pub-id-type="medline">26639750</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lauer</surname><given-names>MS</given-names> </name><name name-style="western"><surname>Blackstone</surname><given-names>EH</given-names> </name><name name-style="western"><surname>Young</surname><given-names>JB</given-names> </name><name name-style="western"><surname>Topol</surname><given-names>EJ</given-names> </name></person-group><article-title>Cause of death in clinical research: time for a reassessment?</article-title><source>J Am Coll Cardiol</source><year>1999</year><month>09</month><volume>34</volume><issue>3</issue><fpage>618</fpage><lpage>620</lpage><pub-id pub-id-type="doi">10.1016/s0735-1097(99)00250-8</pub-id><pub-id pub-id-type="medline">10483939</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hart</surname><given-names>JD</given-names> </name><name name-style="western"><surname>Sorchik</surname><given-names>R</given-names> </name><name name-style="western"><surname>Bo</surname><given-names>KS</given-names> </name><etal/></person-group><article-title>Improving medical certification of cause of death: effective strategies and approaches based on experiences from the Data for Health Initiative</article-title><source>BMC Med</source><year>2020</year><month>03</month><day>9</day><volume>18</volume><issue>1</issue><fpage>74</fpage><pub-id pub-id-type="doi">10.1186/s12916-020-01519-8</pub-id><pub-id pub-id-type="medline">32146900</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ter-Minassian</surname><given-names>M</given-names> </name><name name-style="western"><surname>Basra</surname><given-names>SS</given-names> </name><name name-style="western"><surname>Watson</surname><given-names>ES</given-names> </name><name name-style="western"><surname>Derus</surname><given-names>AJ</given-names> </name><name name-style="western"><surname>Horberg</surname><given-names>MA</given-names> </name></person-group><article-title>Validation of US CDC National Death Index mortality data, focusing on differences in race and ethnicity</article-title><source>BMJ Health Care Inform</source><year>2023</year><month>07</month><volume>30</volume><issue>1</issue><fpage>e100737</fpage><pub-id pub-id-type="doi">10.1136/bmjhci-2023-100737</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Antolini</surname><given-names>L</given-names> </name><name name-style="western"><surname>DiFrancesco</surname><given-names>JC</given-names> </name><name name-style="western"><surname>Zedde</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Spontaneous ARIA-like events in cerebral amyloid angiopathy-related inflammation: a multicenter prospective longitudinal cohort study</article-title><source>Neurology (ECronicon)</source><year>2021</year><month>11</month><day>2</day><volume>97</volume><issue>18</issue><fpage>e1809</fpage><lpage>e1822</lpage><pub-id pub-id-type="doi">10.1212/WNL.0000000000012778</pub-id><pub-id pub-id-type="medline">34531298</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Riley</surname><given-names>GF</given-names> </name></person-group><article-title>Administrative and claims records as sources of health care cost data</article-title><source>Med Care</source><year>2009</year><month>07</month><volume>47</volume><issue>7 Suppl 1</issue><fpage>S51</fpage><lpage>5</lpage><pub-id pub-id-type="doi">10.1097/MLR.0b013e31819c95aa</pub-id><pub-id pub-id-type="medline">19536019</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Haut</surname><given-names>ER</given-names> </name><name name-style="western"><surname>Pronovost</surname><given-names>PJ</given-names> </name><name name-style="western"><surname>Schneider</surname><given-names>EB</given-names> </name></person-group><article-title>Limitations of administrative databases</article-title><source>JAMA</source><year>2012</year><month>06</month><day>27</day><volume>307</volume><issue>24</issue><fpage>2589</fpage><pub-id pub-id-type="doi">10.1001/jama.2012.6626</pub-id><pub-id pub-id-type="medline">22735421</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Taksler</surname><given-names>GB</given-names> </name><name name-style="western"><surname>Dalton</surname><given-names>JE</given-names> </name><name name-style="western"><surname>Perzynski</surname><given-names>AT</given-names> </name><etal/></person-group><article-title>Opportunities, pitfalls, and alternatives in adapting electronic health records for health services research</article-title><source>Med Decis Making</source><year>2021</year><month>02</month><volume>41</volume><issue>2</issue><fpage>133</fpage><lpage>142</lpage><pub-id pub-id-type="doi">10.1177/0272989X20954403</pub-id><pub-id pub-id-type="medline">32969760</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Aiello</surname><given-names>AE</given-names> </name><name name-style="western"><surname>Renson</surname><given-names>A</given-names> </name><name name-style="western"><surname>Zivich</surname><given-names>PN</given-names> </name></person-group><article-title>Social media- and internet-based disease surveillance for public health</article-title><source>Annu Rev Public Health</source><year>2020</year><month>04</month><day>2</day><volume>41</volume><fpage>101</fpage><lpage>118</lpage><pub-id pub-id-type="doi">10.1146/annurev-publhealth-040119-094402</pub-id><pub-id pub-id-type="medline">31905322</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Abdullah</surname><given-names>S</given-names> </name><name name-style="western"><surname>Choudhury</surname><given-names>T</given-names> </name></person-group><article-title>Sensing technologies for monitoring serious mental illnesses</article-title><source>IEEE MultiMedia</source><year>2018</year><volume>25</volume><issue>1</issue><fpage>61</fpage><lpage>75</lpage><pub-id pub-id-type="doi">10.1109/MMUL.2018.011921236</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Charles-Smith</surname><given-names>LE</given-names> </name><name name-style="western"><surname>Reynolds</surname><given-names>TL</given-names> </name><name name-style="western"><surname>Cameron</surname><given-names>MA</given-names> </name><etal/></person-group><article-title>Using social media for actionable disease surveillance and outbreak management: a systematic literature review</article-title><source>PLoS ONE</source><year>2015</year><volume>10</volume><issue>10</issue><fpage>e0139701</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0139701</pub-id><pub-id pub-id-type="medline">26437454</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dey</surname><given-names>V</given-names> </name><name name-style="western"><surname>Krasniak</surname><given-names>P</given-names> </name><name name-style="western"><surname>Nguyen</surname><given-names>M</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>C</given-names> </name><name name-style="western"><surname>Ning</surname><given-names>X</given-names> </name></person-group><article-title>A pipeline to understand emerging illness via social media data analysis: case study on breast implant illness</article-title><source>JMIR Med Inform</source><year>2021</year><month>11</month><day>29</day><volume>9</volume><issue>11</issue><fpage>e29768</fpage><pub-id pub-id-type="doi">10.2196/29768</pub-id><pub-id pub-id-type="medline">34847064</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chapman</surname><given-names>B</given-names> </name><name name-style="western"><surname>Raymond</surname><given-names>B</given-names> </name><name name-style="western"><surname>Powell</surname><given-names>D</given-names> </name></person-group><article-title>Potential of social media as a tool to combat foodborne illness</article-title><source>Perspect Public Health</source><year>2014</year><month>07</month><volume>134</volume><issue>4</issue><fpage>225</fpage><lpage>230</lpage><pub-id pub-id-type="doi">10.1177/1757913914538015</pub-id><pub-id pub-id-type="medline">24990140</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>De Choudhury</surname><given-names>M</given-names> </name><name name-style="western"><surname>Gamon</surname><given-names>M</given-names> </name><name name-style="western"><surname>Counts</surname><given-names>S</given-names> </name><name name-style="western"><surname>Horvitz</surname><given-names>E</given-names> </name></person-group><article-title>Predicting depression via social media</article-title><source>Proc Int AAAI Conf Weblogs Soc Media</source><year>2013</year><volume>7</volume><pub-id pub-id-type="doi">10.1609/icwsm.v7i1.14432</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Centola</surname><given-names>D</given-names> </name></person-group><article-title>Social media and the science of health behavior</article-title><source>Circulation</source><year>2013</year><month>05</month><day>28</day><volume>127</volume><issue>21</issue><fpage>2135</fpage><lpage>2144</lpage><pub-id pub-id-type="doi">10.1161/CIRCULATIONAHA.112.101816</pub-id><pub-id pub-id-type="medline">23716382</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>De Choudhury</surname><given-names>M</given-names> </name><name name-style="western"><surname>Counts</surname><given-names>S</given-names> </name><name name-style="western"><surname>Horvitz</surname><given-names>E</given-names> </name></person-group><article-title>Predicting postpartum changes in emotion and behavior via social media</article-title><conf-name>CHI &#x2019;13: CHI Conference on Human Factors in Computing Systems</conf-name><conf-date>Apr 27 to May 2, 2013</conf-date><conf-loc>Paris, France</conf-loc><pub-id pub-id-type="doi">10.1145/2470654.2466447</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Al-Garadi</surname><given-names>MA</given-names> </name><name name-style="western"><surname>Khan</surname><given-names>MS</given-names> </name><name name-style="western"><surname>Varathan</surname><given-names>KD</given-names> </name><name name-style="western"><surname>Mujtaba</surname><given-names>G</given-names> </name><name name-style="western"><surname>Al-Kabsi</surname><given-names>AM</given-names> </name></person-group><article-title>Using online social networks to track a pandemic: a systematic review</article-title><source>J Biomed Inform</source><year>2016</year><month>08</month><volume>62</volume><fpage>1</fpage><lpage>11</lpage><pub-id pub-id-type="doi">10.1016/j.jbi.2016.05.005</pub-id><pub-id pub-id-type="medline">27224846</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Naslund</surname><given-names>JA</given-names> </name><name name-style="western"><surname>Bondre</surname><given-names>A</given-names> </name><name name-style="western"><surname>Torous</surname><given-names>J</given-names> </name><name name-style="western"><surname>Aschbrenner</surname><given-names>KA</given-names> </name></person-group><article-title>Social media and mental health: benefits, risks, and opportunities for research and practice</article-title><source>J Technol Behav Sci</source><year>2020</year><month>09</month><volume>5</volume><issue>3</issue><fpage>245</fpage><lpage>257</lpage><pub-id pub-id-type="doi">10.1007/s41347-020-00134-x</pub-id><pub-id pub-id-type="medline">33415185</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Stefanidis</surname><given-names>A</given-names> </name><name name-style="western"><surname>Crooks</surname><given-names>A</given-names> </name><name name-style="western"><surname>Radzikowski</surname><given-names>J</given-names> </name></person-group><article-title>Harvesting ambient geospatial information from social media feeds</article-title><source>GeoJournal</source><year>2013</year><month>04</month><volume>78</volume><issue>2</issue><fpage>319</fpage><lpage>338</lpage><pub-id pub-id-type="doi">10.1007/s10708-011-9438-2</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Broniatowski</surname><given-names>DA</given-names> </name><name name-style="western"><surname>Paul</surname><given-names>MJ</given-names> </name><name name-style="western"><surname>Dredze</surname><given-names>M</given-names> </name></person-group><article-title>National and local influenza surveillance through Twitter: an analysis of the 2012-2013 influenza epidemic</article-title><source>PLoS One</source><year>2013</year><volume>8</volume><issue>12</issue><fpage>e83672</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0083672</pub-id><pub-id pub-id-type="medline">24349542</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sarker</surname><given-names>A</given-names> </name><name name-style="western"><surname>Ginn</surname><given-names>R</given-names> </name><name name-style="western"><surname>Nikfarjam</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Utilizing social media data for pharmacovigilance: a review</article-title><source>J Biomed Inform</source><year>2015</year><month>04</month><volume>54</volume><fpage>202</fpage><lpage>212</lpage><pub-id pub-id-type="doi">10.1016/j.jbi.2015.02.004</pub-id><pub-id pub-id-type="medline">25720841</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Al-Garadi</surname><given-names>MA</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>YC</given-names> </name><name name-style="western"><surname>Cai</surname><given-names>H</given-names> </name><etal/></person-group><article-title>Text classification models for the automatic detection of nonmedical prescription medication use from social media</article-title><source>BMC Med Inform Decis Mak</source><year>2021</year><month>01</month><day>26</day><volume>21</volume><issue>1</issue><fpage>27</fpage><pub-id pub-id-type="doi">10.1186/s12911-021-01394-0</pub-id><pub-id pub-id-type="medline">33499852</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Thackeray</surname><given-names>R</given-names> </name><name name-style="western"><surname>Neiger</surname><given-names>BL</given-names> </name><name name-style="western"><surname>Smith</surname><given-names>AK</given-names> </name><name name-style="western"><surname>Van Wagenen</surname><given-names>SB</given-names> </name></person-group><article-title>Adoption and use of social media among public health departments</article-title><source>BMC Public Health</source><year>2012</year><month>03</month><day>26</day><volume>12</volume><fpage>1</fpage><lpage>6</lpage><pub-id pub-id-type="doi">10.1186/1471-2458-12-242</pub-id><pub-id pub-id-type="medline">22449137</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Vereen</surname><given-names>RN</given-names> </name><name name-style="western"><surname>Kurtzman</surname><given-names>R</given-names> </name><name name-style="western"><surname>Noar</surname><given-names>SM</given-names> </name></person-group><article-title>Are social media interventions for health behavior change efficacious among populations with health disparities?: A meta-analytic review</article-title><source>Health Commun</source><year>2023</year><month>01</month><volume>38</volume><issue>1</issue><fpage>133</fpage><lpage>140</lpage><pub-id pub-id-type="doi">10.1080/10410236.2021.1937830</pub-id><pub-id pub-id-type="medline">34148445</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gough</surname><given-names>A</given-names> </name><name name-style="western"><surname>Hunter</surname><given-names>RF</given-names> </name><name name-style="western"><surname>Ajao</surname><given-names>O</given-names> </name><etal/></person-group><article-title>Tweet for behavior change: using social media for the dissemination of public health messages</article-title><source>JMIR Public Health Surveill</source><year>2017</year><month>03</month><day>23</day><volume>3</volume><issue>1</issue><fpage>e14</fpage><pub-id pub-id-type="doi">10.2196/publichealth.6313</pub-id><pub-id pub-id-type="medline">28336503</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Fung</surname><given-names>ICH</given-names> </name><name name-style="western"><surname>Tse</surname><given-names>ZTH</given-names> </name><name name-style="western"><surname>Fu</surname><given-names>KW</given-names> </name></person-group><article-title>The use of social media in public health surveillance</article-title><source>Western Pac Surveill Response J</source><year>2015</year><volume>6</volume><issue>2</issue><fpage>3</fpage><lpage>6</lpage><pub-id pub-id-type="doi">10.5365/WPSAR.2015.6.1.019</pub-id><pub-id pub-id-type="medline">26306208</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>McHugh</surname><given-names>ML</given-names> </name></person-group><article-title>Interrater reliability: the kappa statistic</article-title><source>Biochem Med (Zagreb)</source><year>2012</year><volume>22</volume><issue>3</issue><fpage>276</fpage><lpage>282</lpage><pub-id pub-id-type="medline">23092060</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>South</surname><given-names>B</given-names> </name><name name-style="western"><surname>Shen</surname><given-names>S</given-names> </name><name name-style="western"><surname>Leng</surname><given-names>J</given-names> </name><name name-style="western"><surname>Forbush</surname><given-names>TB</given-names> </name><name name-style="western"><surname>DuVall</surname><given-names>SL</given-names> </name><name name-style="western"><surname>Chapman</surname><given-names>WW</given-names> </name></person-group><article-title>A prototype tool set to support machine-assisted annotation</article-title><conf-name>BioNLP: Proceedings of the 2012 Workshop on Biomedical Natural Language Processing</conf-name><conf-date>Jun 8, 2012</conf-date><conf-loc>Montreal, Canada</conf-loc></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Devlin</surname><given-names>J</given-names> </name><name name-style="western"><surname>Chang</surname><given-names>MW</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>K</given-names> </name><name name-style="western"><surname>Toutanova</surname><given-names>K</given-names> </name></person-group><article-title>BERT: pre-training of deep bidirectional transformers for language understanding</article-title><source>arXiv</source><comment>Preprint posted online on  May 24, 2019</comment><pub-id pub-id-type="doi">10.48550/arXiv.1810.04805</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Ott</surname><given-names>M</given-names> </name><name name-style="western"><surname>Goyal</surname><given-names>N</given-names> </name><etal/></person-group><article-title>RoBERTa: a robustly optimized BERT pretraining approach</article-title><source>arXiv</source><comment>Preprint posted online on  Jul 26, 2019</comment><pub-id pub-id-type="doi">10.48550/arXiv.1907.11692</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Lan</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>M</given-names> </name><name name-style="western"><surname>Goodman</surname><given-names>S</given-names> </name><name name-style="western"><surname>Gimpel</surname><given-names>K</given-names> </name><name name-style="western"><surname>Sharma</surname><given-names>P</given-names> </name><name name-style="western"><surname>Soricut</surname><given-names>R</given-names> </name></person-group><article-title>ALBERT: A Lite BERT for self-supervised learning of language representations</article-title><source>arXiv</source><comment>Preprint posted online on  Feb 9, 2020</comment><pub-id pub-id-type="doi">10.48550/arXiv.1909.11942</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Nguyen</surname><given-names>DQ</given-names> </name><name name-style="western"><surname>Vu</surname><given-names>T</given-names> </name><name name-style="western"><surname>Nguyen</surname><given-names>AT</given-names> </name></person-group><article-title>BERTweet: a pre-trained language model for english tweets</article-title><source>arXiv</source><comment>Preprint posted online on  Oct 5, 2020</comment><pub-id pub-id-type="doi">10.48550/arXiv.2005.10200</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Touvron</surname><given-names>H</given-names> </name><name name-style="western"><surname>Lavril</surname><given-names>T</given-names> </name><name name-style="western"><surname>Izacard</surname><given-names>G</given-names> </name><etal/></person-group><article-title>LLaMA: open and efficient foundation language models</article-title><source>arXiv</source><year>2023</year><month>02</month><day>27</day><pub-id pub-id-type="doi">10.48550/arXiv.2302.13971</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Giorgi</surname><given-names>S</given-names> </name><name name-style="western"><surname>Yaden</surname><given-names>DB</given-names> </name><name name-style="western"><surname>Eichstaedt</surname><given-names>JC</given-names> </name><etal/></person-group><article-title>Predicting U.S. county opioid poisoning mortality from multi-modal social media and psychological self-report data</article-title><source>Sci Rep</source><year>2023</year><month>06</month><day>3</day><volume>13</volume><issue>1</issue><fpage>9027</fpage><pub-id pub-id-type="doi">10.1038/s41598-023-34468-2</pub-id><pub-id pub-id-type="medline">37270657</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Eichstaedt</surname><given-names>JC</given-names> </name><name name-style="western"><surname>Schwartz</surname><given-names>HA</given-names> </name><name name-style="western"><surname>Kern</surname><given-names>ML</given-names> </name><etal/></person-group><article-title>Psychological language on Twitter predicts county-level heart disease mortality</article-title><source>Psychol Sci</source><year>2015</year><month>02</month><volume>26</volume><issue>2</issue><fpage>159</fpage><lpage>169</lpage><pub-id pub-id-type="doi">10.1177/0956797614557867</pub-id><pub-id pub-id-type="medline">25605707</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Doerstling</surname><given-names>SS</given-names> </name><name name-style="western"><surname>Akrobetu</surname><given-names>D</given-names> </name><name name-style="western"><surname>Engelhard</surname><given-names>MM</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>F</given-names> </name><name name-style="western"><surname>Ubel</surname><given-names>PA</given-names> </name></person-group><article-title>A disease identification algorithm for medical crowdfunding campaigns: validation study</article-title><source>J Med Internet Res</source><year>2022</year><month>06</month><day>21</day><volume>24</volume><issue>6</issue><fpage>e32867</fpage><pub-id pub-id-type="doi">10.2196/32867</pub-id><pub-id pub-id-type="medline">35727610</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhang</surname><given-names>X</given-names> </name><name name-style="western"><surname>Tao</surname><given-names>X</given-names> </name><name name-style="western"><surname>Ji</surname><given-names>B</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>R</given-names> </name><name name-style="western"><surname>S&#x00F6;rensen</surname><given-names>S</given-names> </name></person-group><article-title>The success of cancer crowdfunding campaigns: project and text analysis</article-title><source>J Med Internet Res</source><year>2023</year><month>03</month><day>3</day><volume>25</volume><fpage>e44197</fpage><pub-id pub-id-type="doi">10.2196/44197</pub-id><pub-id pub-id-type="medline">36692283</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tourassi</surname><given-names>G</given-names> </name><name name-style="western"><surname>Yoon</surname><given-names>HJ</given-names> </name><name name-style="western"><surname>Xu</surname><given-names>S</given-names> </name></person-group><article-title>A novel web informatics approach for automated surveillance of cancer mortality trends</article-title><source>J Biomed Inform</source><year>2016</year><month>06</month><volume>61</volume><fpage>110</fpage><lpage>118</lpage><pub-id pub-id-type="doi">10.1016/j.jbi.2016.03.027</pub-id><pub-id pub-id-type="medline">27044930</pub-id></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>He</surname><given-names>K</given-names> </name><name name-style="western"><surname>Yao</surname><given-names>L</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>J</given-names> </name><name name-style="western"><surname>Li</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Li</surname><given-names>C</given-names> </name></person-group><article-title>Construction of genealogical knowledge graphs from obituaries: multitask neural network extraction system</article-title><source>J Med Internet Res</source><year>2021</year><month>08</month><day>4</day><volume>23</volume><issue>8</issue><fpage>e25670</fpage><pub-id pub-id-type="doi">10.2196/25670</pub-id><pub-id pub-id-type="medline">34346903</pub-id></nlm-citation></ref><ref id="ref44"><label>44</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Warren</surname><given-names>K</given-names> </name></person-group><source>From Death Notice to the Cyber Obit: The History of the Overdose Obituary (Unpublished manuscript)</source><access-date>2025-07-16</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://projects.iq.harvard.edu/files/historyopioidepidemic/files/katherine_warren_paper.pdf?utm_source=chatgpt.com">https://projects.iq.harvard.edu/files/historyopioidepidemic/files/katherine_warren_paper.pdf?utm_source=chatgpt.com</ext-link></comment></nlm-citation></ref><ref id="ref45"><label>45</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>LeNoue-Newton</surname><given-names>M</given-names> </name><name name-style="western"><surname>al-Garadi</surname><given-names>M</given-names> </name><name name-style="western"><surname>Ngan</surname><given-names>K</given-names> </name><etal/></person-group><article-title>Augmenting fact and date of death in electronic health records using internet media sources: a validation study from two large healthcare systems</article-title><source>medRxiv</source><comment>Preprint posted online on  Jan 27, 2025</comment><pub-id pub-id-type="doi">10.1101/2025.01.24.25321042</pub-id></nlm-citation></ref><ref id="ref46"><label>46</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Al-Garadi</surname><given-names>M</given-names> </name><name name-style="western"><surname>LeNoue-Newton</surname><given-names>M</given-names> </name><name name-style="western"><surname>Matheny</surname><given-names>ME</given-names> </name><etal/></person-group><article-title>Automated extraction of mortality information from publicly available sources using language models</article-title><source>medRxiv</source><comment>Preprint posted online on  Nov 1, 2024</comment><pub-id pub-id-type="doi">10.1101/2024.10.28.24316027</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Annotation guidelines, metric definitions, confusion matrices, and prompt examples used for extracting mortality information and causes of death from public web-based posts.</p><media xlink:href="jmir_v27i1e71113_app1.docx" xlink:title="DOCX File, 379 KB"/></supplementary-material><supplementary-material id="app2"><label>Multimedia Appendix 2</label><p>Availability of cause of death within social media posts. Social media posts were annotated for potential causes of death using the annotation guidelines outlined in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. Social media sources were assessed for information density related to cause of death information by categorizing a post as having either no medical conditions mentioned, a single medical condition mentioned, or having multiple unique medical conditions within the post.</p><media xlink:href="jmir_v27i1e71113_app2.png" xlink:title="PNG File, 107 KB"/></supplementary-material></app-group></back></article>