<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id><journal-id journal-id-type="publisher-id">jmir</journal-id><journal-id journal-id-type="index">1</journal-id><journal-title>Journal of Medical Internet Research</journal-title><abbrev-journal-title>J Med Internet Res</abbrev-journal-title><issn pub-type="epub">1438-8871</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v28i1e85057</article-id><article-id pub-id-type="doi">10.2196/85057</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Large Language Model&#x2013;Based Analysis of Statin Therapy Discussions and Sentiment on Social Media: Cross-Sectional Observational Study</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Liu</surname><given-names>Siru</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Liu</surname><given-names>Jialin</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="aff" rid="aff4">4</xref></contrib></contrib-group><aff id="aff1"><institution>Department of Biomedical Informatics, Vanderbilt University Medical Center</institution><addr-line>2525 West End Ave #1475</addr-line><addr-line>Nashville</addr-line><addr-line>TN</addr-line><country>United States</country></aff><aff id="aff2"><institution>Department of Computer Science, Vanderbilt University</institution><addr-line>Nashville</addr-line><addr-line>TN</addr-line><country>United States</country></aff><aff id="aff3"><institution>Department of Medical Informatics, West China Medical School</institution><addr-line>Chengdu</addr-line><country>China</country></aff><aff id="aff4"><institution>Department of Otolaryngology-Head and Neck Surgery, West China Hospital, Sichuan University</institution><addr-line>Chengdu</addr-line><country>China</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Mavragani</surname><given-names>Amaryllis</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Wreyford</surname><given-names>Leon</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Zhu</surname><given-names>Yenan</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Siru Liu, PhD, Department of Biomedical Informatics, Vanderbilt University Medical Center, 2525 West End Ave #1475, Nashville, TN, 610041, United States, 1 615-875-5216; <email>siru.liu@vumc.org</email></corresp></author-notes><pub-date pub-type="collection"><year>2026</year></pub-date><pub-date pub-type="epub"><day>10</day><month>4</month><year>2026</year></pub-date><volume>28</volume><elocation-id>e85057</elocation-id><history><date date-type="received"><day>30</day><month>09</month><year>2025</year></date><date date-type="rev-recd"><day>02</day><month>02</month><year>2026</year></date><date date-type="accepted"><day>24</day><month>03</month><year>2026</year></date></history><copyright-statement>&#x00A9; Siru Liu, Jialin Liu. Originally published in the Journal of Medical Internet Research (<ext-link ext-link-type="uri" xlink:href="https://www.jmir.org">https://www.jmir.org</ext-link>), 10.4.2026. </copyright-statement><copyright-year>2026</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research (ISSN 1438-8871), is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://www.jmir.org/">https://www.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://www.jmir.org/2026/1/e85057"/><abstract><sec><title>Background</title><p>Statin therapy, despite proven cardiovascular benefits, remains underused. Social media platforms may capture patient perspectives that are less visible in clinical encounters.</p></sec><sec><title>Objective</title><p>This study aimed to characterize themes, sentiment, and decision-making factors related to statin therapy through large language model (LLM)&#x2013;based analysis of Reddit discussions.</p></sec><sec sec-type="methods"><title>Methods</title><p>This cross-sectional observational study analyzed English-language Reddit posts and comments mentioning statins from January 2022 to May 2025, identified via keyword-based Reddit application programming interface searches (&#x2264;1000 posts per keyword). A total of 5328 retrieved discussions (n=1661, 31.2% posts and n=3667, 68.8% keyword-containing comments) from public subreddits were included. Themes, sentiments (positive, neutral, or negative), guideline-informed clinical relevance, information-seeking behavior, adverse effect mentions, decision factors, and adherence-related content were extracted using an LLM-based pipeline.</p></sec><sec sec-type="results"><title>Results</title><p>Among 5328 discussions, prominent topics included adverse effects (n=1697, 31.9%), decision-making references related to laboratory results and physician advice (n=2767, 51.9% and n=2034, 38.2%, respectively), and alternative approaches (n=2485, 46.6%). Overall sentiment was neutral in 34% (n=1812) of discussions, negative in 30.9% (n=1646), and positive in 16.9% (n=900); the remainder were mixed or unclear. Statin-directed sentiment was neutral in 44.1% (n=2350) of discussions, negative in 25.2% (n=1343), and positive in 12.5% (n=666); the remainder did not express statin-directed sentiment. High clinical relevance was identified in 12.6% (n=672) of discussions. Adherence-related issues were mentioned in 29.8% (n=1587) of discussions. Among adverse effect mentions, muscle pain (n=129, 7.6%) and fatigue (n=110, 6.5%) were common.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>LLM-enabled analysis of Reddit discourse highlights substantial negative sentiment, adherence-related concerns, and adverse effect narratives surrounding statin therapy. These findings suggest opportunities for patient-centered communication and shared decision-making strategies that address symptom attribution, uncertainty, and information needs in digital information environments.</p></sec></abstract><kwd-group><kwd>statin therapy</kwd><kwd>social media</kwd><kwd>large language model</kwd><kwd>sentiment analysis</kwd><kwd>Reddit</kwd><kwd>cardiovascular disease</kwd><kwd>patient perspectives</kwd><kwd>adherence</kwd><kwd>adverse effects</kwd><kwd>cohort study</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Statins are among the most widely prescribed medications globally, with more than 200 million individuals using these agents to reduce cardiovascular morbidity and mortality [<xref ref-type="bibr" rid="ref1">1</xref>]. These 3-hydroxy-3-methylglutaryl coenzyme A reductase inhibitors remain the cornerstone of atherosclerotic cardiovascular disease (ASCVD) prevention, demonstrating well-established efficacy in both primary and secondary prevention settings [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref3">3</xref>]. Despite their proven benefits, real-world statin therapy is frequently limited by concerns regarding safety and tolerability. In routine care, statin-related events are commonly documented, with myalgia and myopathy representing the most frequent category, and these events often precipitate temporary discontinuation and subsequent rechallenge [<xref ref-type="bibr" rid="ref4">4</xref>]. Consequently, long-term use remains suboptimal; a recent systematic review and meta-analysis found that only approximately 62% of patients achieve good adherence (&#x2265;80% use) over a median follow-up of 24 months [<xref ref-type="bibr" rid="ref5">5</xref>], while population-based primary care data show frequent discontinuation with substantial restarting, consistent with an intermittent use pattern in practice [<xref ref-type="bibr" rid="ref6">6</xref>].</p><p>Traditional clinical research methods, including randomized controlled trials and observational studies, may not fully capture the breadth of patient experiences and concerns in routine care [<xref ref-type="bibr" rid="ref7">7</xref>]. Effective communication between patients and health care providers is essential for shared decision-making and treatment adherence; however, barriers such as limited consultation time, health literacy challenges, and patient reluctance to disclose adverse experiences may constrain insight into the real-world challenges of medication use [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref9">9</xref>]. Patients may hesitate to report symptoms or concerns to clinicians due to fear of judgment, desire to avoid conflict with prescribers, or uncertainty about whether their experiences warrant clinical attention [<xref ref-type="bibr" rid="ref9">9</xref>]. Social media platforms, especially Reddit (Reddit, Inc), provide access to unfiltered patient narratives that may not be expressed during clinical encounters [<xref ref-type="bibr" rid="ref10">10</xref>-<xref ref-type="bibr" rid="ref13">13</xref>]. Reddit hosts a wide range of health-related communities and has more than 50 million daily active users [<xref ref-type="bibr" rid="ref14">14</xref>]. Within these forums, individuals share personal medical experiences, seek peer advice, and discuss treatment decisions. These discussions may provide valuable insights into patient beliefs, motivations, and barriers that influence medication adherence and cardiovascular risk management [<xref ref-type="bibr" rid="ref15">15</xref>-<xref ref-type="bibr" rid="ref17">17</xref>].</p><p>Recent advances in large language models (LLMs) offer scalable methods to analyze such unstructured, high-volume textual data, enabling systematic characterization of patient perspectives at a granularity that would be infeasible using manual qualitative approaches alone [<xref ref-type="bibr" rid="ref18">18</xref>]. In the context of cardiovascular prevention, applying LLMs to social media discourse may provide novel insights into how patients interpret statin-related information, evaluate perceived risks and benefits, and make adherence decisions outside the clinical setting. Accordingly, this study aimed to systematically analyze Reddit discussions related to statin use using an LLM to characterize patient-reported experiences, identify recurrent concerns and misconceptions, and explore factors influencing decision-making and adherence. By integrating patient-generated narratives with computational text analysis, this work seeks to complement traditional evidence sources and inform more patient-centered approaches to cardiovascular risk management.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Study Design and Data Source</title><p>This cross-sectional study analyzed publicly available Reddit discussions about statin therapy posted between January 1, 2022, and May 1, 2025. Reddit was selected because it hosts large, topic-specific health communities in which users openly share medication experiences, treatment decisions, and interactions with health care providers in naturalistic settings. Data were accessed via the official Reddit application programming interface (API) using Python Reddit API Wrapper, limited to public subreddits, and no user contact or reidentification attempts were made.</p></sec><sec id="s2-2"><title>Data Collection</title><sec id="s2-2-1"><title>Search Strategy</title><p>We retrieved content using &#x201C;statin,&#x201D; generic statin names (eg, atorvastatin, rosuvastatin, simvastatin, pravastatin, lovastatin, fluvastatin, and pitavastatin), and US brand names (eg, Lipitor, Crestor, Zocor, Pravachol, Livalo, Lescol, and Mevacor); full queries are provided in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p></sec><sec id="s2-2-2"><title>API Procedure</title><p>Using Python Reddit API Wrapper (version 7.7.1) in Python (version 3.9; Python Software Foundation; May 15-May 20, 2025), we queried Reddit&#x2019;s search end point (sorted by &#x201C;new&#x201D; where available). Due to indexing and API constraints, each keyword returned up to 1000 submissions. For each submission, we extracted metadata (submission ID, created_utc, subreddit, title, selftext, author, score, comment count, and permalink) and downloaded its comment tree (comment ID, parent ID, created_utc, author, body, and score). We retained submissions within the study window; pagination, time stamps, and rate-limit handling are described in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p></sec><sec id="s2-2-3"><title>Eligibility</title><p>We included English-language posts and comments from public subreddits that matched 1 or more keywords (case-insensitive) within the study window and excluded removed and deleted placeholders, duplicates, non-English text (langdetect v1.0.9), and promotional and spam content (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p></sec><sec id="s2-2-4"><title>Unit of Analysis</title><p>The unit of analysis was a Reddit discussion thread (eligible submission plus associated comments), enabling contextual interpretation of patient narratives and peer responses and supporting downstream LLM-based thematic extraction [<xref ref-type="bibr" rid="ref19">19</xref>].</p></sec></sec><sec id="s2-3"><title>Data Cleaning and Preprocessing</title><p>We removed URLs and normalized whitespace while preserving the original wording (no stemming or lemmatization). Privacy protection included removing @mentions and replacing detected email addresses and phone numbers with placeholders (eg, &#x201C;[EMAIL],&#x201D; &#x201C;[PHONE]&#x201D;); subreddit names were retained as public metadata, with reidentification risk minimized via aggregate reporting and avoidance of traceable quotations [<xref ref-type="bibr" rid="ref20">20</xref>]. English language posts were identified using fastText (lid.176.bin) [<xref ref-type="bibr" rid="ref21">21</xref>] (retain &#x2265;0.80, adjudicate 0.60-0.80 by 2 investigators, and exclude &#x003C;0.60). For analysis, comments were retained if they contained 1 or more keywords; misspellings and variants were captured via regex-based partial matching with guardrails. Exact duplicates were removed via SHA-256 hashing, and near duplicates were excluded using MinHash with Jaccard similarity &#x2265;0.85 [<xref ref-type="bibr" rid="ref22">22</xref>]. All steps were deterministic and version controlled; a PRISMA (Preferred Reporting Items for Systematic Reviews and Meta-Analyses)&#x2013;style flow diagram is provided in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p></sec><sec id="s2-4"><title>LLM-Based Content Extraction</title><p>Structured extraction used GPT-4.1 [<xref ref-type="bibr" rid="ref23">23</xref>] via the OpenAI API (version 1.52.0) between May and June 2025 with standardized parameters (temperature=0.1, top_p=1.0, and max_tokens=4096). A single prompt template and predefined JSON schema were applied to all discussions. Two investigators iteratively developed the schema and decision rules through pilot testing on 50 purposively sampled discussions and consensus refinement of edge cases, consistent with clinical reasoning standards [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref24">24</xref>]. For 11 analytic domains (<xref ref-type="table" rid="table1">Table 1</xref>), outputs included structured variables, brief summaries, and verbatim evidence quotes supporting key classifications. Dietary changes and exercise were coded as alternative approaches only when explicitly discussed as substitutes for statin therapy (eg, attempting to avoid, delay, or discontinue statins); when described as adjuncts alongside statins, they were not classified as alternatives. Outputs failing JSON validation or missing mandatory evidence were automatically requeried up to 3 times; only schema-valid outputs were retained (<xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>).</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>GPT-4.1 content analysis framework with examples.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Domain</td><td align="left" valign="bottom">Description</td><td align="left" valign="bottom">Example extractions</td></tr></thead><tbody><tr><td align="left" valign="top">Primary themes</td><td align="left" valign="top">1 to 3 main discussion topics</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Concerns about statin adverse effects, cholesterol management through lifestyle changes, and physician-patient communication</p></list-item></list></td></tr><tr><td align="left" valign="top">Statin medications</td><td align="left" valign="top">Specific statin names mentioned</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Generic: atorvastatin and rosuvastatin</p></list-item><list-item><p>Brand: Lipitor and Crestor</p></list-item></list></td></tr><tr><td align="left" valign="top">Experience type</td><td align="left" valign="top">Postclassification</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Personal experience, information request, and medical advice</p></list-item></list></td></tr><tr><td align="left" valign="top">Sentiment analysis</td><td align="left" valign="top">Multitarget emotional assessment</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Neutral, negative, or positive</p></list-item><list-item><p>Overall, toward statins and toward physicians</p></list-item></list></td></tr><tr><td align="left" valign="top">Clinical relevance</td><td align="left" valign="top">Actionable insight assessment based on AHA<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup> and ACC<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup> guidelines</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>High: ASCVD<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup> history (MI<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup>, stroke, and PAD<sup><xref ref-type="table-fn" rid="table1fn5">e</xref></sup>), LDL-C<sup><xref ref-type="table-fn" rid="table1fn6">f</xref></sup> &#x2265;190 mg/dL, diabetes (in individuals aged 40&#x2010;75 years), and 10-year ASCVD risk &#x2265;7.5%</p></list-item><list-item><p>Medium: family history of premature ASCVD, chronic kidney disease, inflammatory conditions, CAC<sup><xref ref-type="table-fn" rid="table1fn7">g</xref></sup> score &#x2265;100, and smoking</p></list-item><list-item><p>Low: general cardiovascular health discussions</p></list-item></list></td></tr><tr><td align="left" valign="top">Adverse effects</td><td align="left" valign="top">Adverse reactions mentioned</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Muscle pain, fatigue, brain fog, dizziness, nausea, and memory issues</p></list-item></list></td></tr><tr><td align="left" valign="top">Decision factors</td><td align="left" valign="top">Treatment choice influences</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Laboratory results, physician recommendation, and adverse effects</p></list-item></list></td></tr><tr><td align="left" valign="top">Information seeking</td><td align="left" valign="top">Behavioral patterns</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Asking for advice, sharing experience, and seeking alternatives</p></list-item></list></td></tr><tr><td align="left" valign="top">Adherence issues</td><td align="left" valign="top">Medication compliance</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Mentions discontinuation, compliance issues, and dose changes</p></list-item></list></td></tr><tr><td align="left" valign="top">Alternative treatments</td><td align="left" valign="top">Nonstatin options</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Diet changes, exercise, ezetimibe, and coenzyme Q10</p></list-item></list></td></tr><tr><td align="left" valign="top">Emotional indicators</td><td align="left" valign="top">Expressed emotions</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Frustration, confusion, hope, and anxiety</p></list-item></list></td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>AHA: American Heart Association.</p></fn><fn id="table1fn2"><p><sup>b</sup>ACC: American College of Cardiology.</p></fn><fn id="table1fn3"><p><sup>c</sup>ASCVD: atherosclerotic cardiovascular disease.</p></fn><fn id="table1fn4"><p><sup>d</sup>MI: myocardial infarction.</p></fn><fn id="table1fn5"><p><sup>e</sup>PAD: peripheral artery disease.</p></fn><fn id="table1fn6"><p><sup>f</sup>LDL-C: low-density lipoprotein cholesterol.</p></fn><fn id="table1fn7"><p><sup>g</sup>CAC: coronary artery calcium.</p></fn></table-wrap-foot></table-wrap><p>All content was analyzed as user-generated narratives. References to clinician recommendations within discussions (eg, &#x201C;my doctor recommended starting a statin&#x201D;) were coded as patient-reported physician communication rather than independently verified clinical input. Posts containing general medical guidance without a described patient-clinician interaction were not coded under the &#x201C;decision factors&#x201D; physician recommendation category. Clinician perspectives were not independently ascertained; physician-related content was captured only through users&#x2019; own accounts of clinical interactions.</p></sec><sec id="s2-5"><title>Clinical Relevance Tiering</title><p>A deterministic rule-based algorithm aligned with American Heart Association, American College of Cardiology, and US Preventive Services Task Force indicators [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>] assigned high, medium, or low clinical relevance (<xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>). High relevance required explicit mention of ASCVD, low-density lipoprotein cholesterol &#x2265;190 mg/dL, diabetes (in individuals aged 40&#x2010;75 years), or elevated 10-year ASCVD risk, and medium relevance reflected risk-enhancing factors (eg, family history of premature ASCVD, chronic kidney disease, inflammatory conditions, and coronary artery calcium &#x2265;100 Agatston units) [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>]; otherwise, discussions were low relevance. Given self-reported data, absence of criteria was coded as &#x201C;unreported,&#x201D; and tier assignment defaulted downward unless explicit evidence supported a higher tier.</p></sec><sec id="s2-6"><title>Detection of LLM-Related Content</title><p>We searched for mentions of LLM tools (eg, ChatGPT [OpenAI], Claude [Anthropic], and Google Gemini) and categorized them as (1) seeking medical advice, (2) seeking general health information, (3) sharing LLM-generated content, or (4) incidental mentions. Categories 1 to 3 were flagged for sensitivity analyses (<xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>).</p></sec><sec id="s2-7"><title>Validation</title><p>LLM outputs were validated via expert review (<xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>). A stratified random sample of 50 discussions (0.9% of 5328) spanning key domains was independently assessed by 2 reviewers (a clinical informaticist and a physician) using a 5-point accuracy scale (1=very poor to 5=excellent). Interrater agreement used Cohen &#x03BA;. Reviewers also documented recurrent errors. Verbatim evidence requirements enabled direct verification of extracted labels.</p></sec><sec id="s2-8"><title>Statistical Analysis</title><p>Multivariable logistic regression identified factors associated with negative sentiment toward statins. Cluster-robust SEs were estimated at the subreddit level. Covariates were prespecified (clinical relevance tier, adverse effect mentions, adherence-related content, information-seeking behavior, specific statins, and subreddit category). Absence of a mention was coded as &#x201C;not reported.&#x201D; Diagnostics included variance inflation factors and influential observation checks. Results are reported as odds ratios with 95% CIs; 2-sided <italic>P</italic>&#x003C;.05 indicated significance.</p></sec><sec id="s2-9"><title>Ethical Considerations</title><p>This study analyzed publicly accessible Reddit posts and comments as secondary data and involved no direct contact, interaction, intervention, or attempt to reidentify users. Informed consent was not obtained because the study used publicly available online content, the investigators did not interact with users, and obtaining consent from all posters was not feasible. No compensation was provided because no participants were recruited or contacted. The study was exempt from institutional review board approval and aligned with the Association of Internet Researchers&#x2019; Internet Research: Ethical Guidelines 3.0 [<xref ref-type="bibr" rid="ref27">27</xref>].</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Dataset Characteristics and Distribution</title><p>After systematic filtering, the final dataset comprised 5328 discussions contributed by 4832 unique users across multiple Reddit communities. The most frequently represented forum was r/Cholesterol (n=2722, 51.1%). Nearly half of the discussions (n=2552, 47.9%) referenced a specific statin. The most commonly mentioned agents were rosuvastatin (n=1276, 23.9%) and atorvastatin (n=1013, 19%). Dataset characteristics and statin mentions are summarized in <xref ref-type="table" rid="table2">Table 2</xref>.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Characteristics of Reddit discussions and statin mentions (N=5328).</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom" colspan="2">Characteristic and category</td><td align="left" valign="bottom" colspan="2">Mentions, n (%)</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="4">Document type</td></tr><tr><td align="left" valign="top" colspan="2"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Submissions (posts)</td><td align="left" valign="top" colspan="2">1661 (31.2)</td></tr><tr><td align="left" valign="top" colspan="2"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Comments</td><td align="left" valign="top" colspan="2">3667 (68.8)</td></tr><tr><td align="left" valign="top" colspan="4">Source community</td></tr><tr><td align="left" valign="top" colspan="2"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>r/Cholesterol</td><td align="left" valign="top" colspan="2">2722 (51.1)</td></tr><tr><td align="left" valign="top" colspan="2"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>r/PeterAttia</td><td align="left" valign="top" colspan="2">576 (10.8)</td></tr><tr><td align="left" valign="top" colspan="2"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>r/AskDocs</td><td align="left" valign="top" colspan="2">300 (5.6)</td></tr><tr><td align="left" valign="top" colspan="2"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>r/keto</td><td align="left" valign="top" colspan="2">92 (1.7)</td></tr><tr><td align="left" valign="top" colspan="2"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>r/HeartAttack</td><td align="left" valign="top" colspan="2">87 (1.6)</td></tr><tr><td align="left" valign="top" colspan="2"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>r/diabetes_t2</td><td align="left" valign="top" colspan="2">82 (1.5)</td></tr><tr><td align="left" valign="top" colspan="2"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>r/stroke</td><td align="left" valign="top" colspan="2">46 (0.9)</td></tr><tr><td align="left" valign="top" colspan="2"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Other subreddits</td><td align="left" valign="top" colspan="2">1423 (26.7)</td></tr><tr><td align="left" valign="top" colspan="4">Primary discussion type</td></tr><tr><td align="left" valign="top" colspan="2"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Personal experience sharing</td><td align="left" valign="top" colspan="2">3210 (60.2)</td></tr><tr><td align="left" valign="top" colspan="2"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Information request</td><td align="left" valign="top" colspan="2">882 (16.6)</td></tr><tr><td align="left" valign="top" colspan="2"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Medical advice provision</td><td align="left" valign="top" colspan="2">734 (13.8)</td></tr><tr><td align="left" valign="top" colspan="2"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>General discussion</td><td align="left" valign="top" colspan="2">502 (9.4)</td></tr><tr><td align="left" valign="top" colspan="4">Mention of a specific statin</td></tr><tr><td align="left" valign="top" colspan="2"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Yes</td><td align="left" valign="top" colspan="2">2552 (47.9)</td></tr><tr><td align="left" valign="top" colspan="2"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>No</td><td align="left" valign="top" colspan="2">2776 (52.1)</td></tr><tr><td align="left" valign="top" colspan="4">Most frequent statins<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup></td></tr><tr><td align="left" valign="top" colspan="2"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Rosuvastatin (Crestor)</td><td align="left" valign="top" colspan="2">1276 (23.9)</td></tr><tr><td align="left" valign="top" colspan="2"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Atorvastatin (Lipitor)</td><td align="left" valign="top" colspan="2">1013 (19)</td></tr><tr><td align="left" valign="top" colspan="2"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Pravastatin (Pravachol)</td><td align="left" valign="top" colspan="2">279 (5.2)</td></tr><tr><td align="left" valign="top" colspan="2"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Simvastatin (Zocor)</td><td align="left" valign="top" colspan="2">211 (4)</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>Generic and brand name mentions were combined.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-2"><title>Thematic Analysis and Primary Discussion Topics</title><p>Thematic analysis showed that discussions most commonly focused on treatment effectiveness (3311/14,007, 23.6% of thematic mentions), followed by safety and tolerability concerns (n=2366, 16.9%) and alternative lifestyle interventions (n=2081, 14.9%; <xref ref-type="fig" rid="figure1">Figure 1</xref>). Privacy-preserving, paraphrased exemplar posts (1&#x2010;2 per major theme) and the corresponding LLM theme classifications are provided in <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Quantitative distribution of themes in Reddit discussions related to statins (January 2022 to May 2025). The hierarchical tree map illustrates the primary discussion topics identified by the large language model pipeline across 5328 discussions, organized into 5 overarching thematic groups and 10 topic categories. Each discussion could receive up to 3 thematic codes; percentages represent the proportion of total thematic mentions (N=14,007). The 10 most frequent topic categories are shown; remaining thematic mentions (n=3828, 27.3%) comprised less frequent topics and are not displayed.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v28i1e85057_fig01.png"/></fig></sec><sec id="s3-3"><title>Sentiment Analysis</title><p>Overall sentiment was neutral in 34% of discussions, negative in 30.9%, and positive in 16.9%, with the remainder classified as mixed or unclear. Sentiment distributions varied significantly by community type (<italic>&#x03C7;<sub>8</sub></italic>&#x00B2;=335.7; <italic>P</italic>&#x003C;.001). The proportion of discussions with negative sentiment was substantially higher in medical advice&#x2013;seeking forums (eg, r/AskDocs: 77.3%) than in lifestyle-oriented forums (eg, r/Biohackers: 9.1%).</p></sec><sec id="s3-4"><title>Clinical Relevance Assessment</title><p>Among 5328 discussions, using guideline-informed criteria, 12.6% (n=672) of discussions were classified as high clinical relevance, 22.4% (n=1193) as medium relevance, and 65% (n=3463) as low relevance. High-relevance content was most frequent in r/stroke (40/46, 87.0%), r/HeartAttack (41/87, 47.1%), r/diabetes_t2 (29/82, 35.4%), and r/AskDocs (82/300, 27.3%). Clinical information elements were reported as follows: laboratory values (n=2048, 38.4%), cardiovascular events (n=362, 6.8%), family history (n=908, 17%), and lifestyle factors (n=2616, 49.1%).</p></sec><sec id="s3-5"><title>Adverse Effect Reports and Safety Concerns</title><p>Among 5328 discussions, adverse effects were reported in 31.9% (n=1697; 95% CI 30.7%&#x2010;33.2%) of discussions. Among discussions that referenced adverse effects, the most frequent included muscle pain (n=129, 7.6%) and fatigue (n=110, 6.5%), followed by cognitive symptoms such as &#x201C;brain fog&#x201D; (n=61, 3.6%). A detailed breakdown of adverse effects, including neuropsychiatric symptoms, is provided in <xref ref-type="supplementary-material" rid="app5">Multimedia Appendix 5</xref>. In 0.3% (n=17) of discussions, users explicitly stated that no adverse effects occurred.</p></sec><sec id="s3-6"><title>Decision-Making Factors and Treatment Influences</title><p>Of 5328 discussions, the most frequently coded factors associated with statin-related decisions were laboratory results (n=2767, 51.9%), physician recommendations (n=2034, 38.2%), adverse effects (n=1593, 29.9%), and family history of cardiovascular disease (n=822, 15.4%). Additional factors included lifestyle modifications (n=1092, 20.5%), online research (n=573, 10.8%), cost (n=316, 5.9%), and insurance coverage (n=72, 1.4%). Genetic predisposition and clinical guideline recommendations were each coded in 0.5% (n=26 for both) of discussions.</p></sec><sec id="s3-7"><title>Alternative Treatment Discussions</title><p>Among 5328 discussions, alternative treatments were coded in 46.6% (n=2485) of discussions. The most frequent nonpharmacologic alternatives were dietary changes (n=449, 8.4%) and exercise (n=406, 7.6%). Pharmacologic alternatives included ezetimibe (n=168, 3.2%), Repatha (n=84, 1.6%), and Zetia (n=70, 1.3%). Supplements included fish oil (n=60, 1.1%), coenzyme Q10 (n=57, 1.1%), and red yeast rice (n=53, 1%). Weight loss was coded in 1.4% (n=73) of discussions.</p></sec><sec id="s3-8"><title>Information-Seeking Behaviors and Community Engagement</title><p>Among 5328 discussions, experience sharing was coded in 78.2% (n=4167) of discussions and advice seeking was coded in 46.1% (n=2456). Discussions focused on alternative treatments occurred in 7.2% (n=386) of cases, while 5.3% (n=284) included questioning medication necessity. Advice seeking was most frequent in r/AskDocs (n=292, 97.3%).</p></sec><sec id="s3-9"><title>Emotional Indicators and Adherence Issues</title><p>Of the 5328 discussions, emotional expressions were identified in 85.2% (n=4537) of discussions. The most frequently coded emotions were frustration (n=1705, 32%) and confusion (n=911, 17.1%). Medication adherence issues were present in 29.8% (n=1587) of the discussions, including discontinuation (n=522, 9.8%) and dose modification (n=437, 8.2%). Multiple codes per discussion were permitted; therefore, percentages may sum to more than 100%.</p></sec><sec id="s3-10"><title>Mentions of LLM Tools in Reddit Discussions</title><p>Explicit mentions of LLM tools occurred in 23/5,328 (0.4%) discussions, totaling 38 mentions. Of the 38 mentions, ChatGPT accounted for 32 (84.2%), followed by other GPT variants (n=3, 7.9%) and Claude, Bard/Gemini, or DeepSeek (n=3, 7.9% combined). Mentions were coded as statin-related medical decision-making (n=2, 5.3%), information seeking (n=6, 15.8%), and general references (n=30, 78.9%). Discussions containing LLM mentions were most commonly observed in r/PeterAttia (6/23, 26.1%) and r/Cholesterol (5/23, 21.7%). Mentions increased from 6 in 2023 to 32 in January 2025 to May 2025.</p></sec><sec id="s3-11"><title>Expert Validation Results</title><p>Expert validation of a stratified sample of 50 discussions showed a mean validation score of 4.67 (SD 0.74). Interrater agreement was substantial (Cohen &#x03BA;=0.85; 95% CI 0.78-0.92). Expert feedback noted recurring coding challenges in distinguishing genetic risk factors (eg, lipoprotein[a]) from family history, as well as in identifying cardiovascular event&#x2013;related content (eg, coronary artery calcium scores).</p></sec><sec id="s3-12"><title>Statistical Associations</title><p>Sentiment distributions differed across communities (<italic>&#x03C7;</italic>&#x00B2;=335.7; <italic>P</italic>&#x003C;.001). Negative sentiment was more frequent in medical advice&#x2013;seeking communities than in lifestyle-focused communities (eg, r/AskDocs: 77.3% vs r/Biohackers: 9.1%; <italic>P</italic>&#x003C;.001). Adverse effect reporting also differed by community type (<italic>&#x03C7;<sub>2</sub></italic>&#x00B2;=124.6; <italic>P</italic>&#x003C;.001). Adverse effect mentions and adherence issues were associated with negative sentiment (<italic>P</italic>&#x003C;.001 for both). In adjusted multivariable analysis, factors associated with negative sentiment included adverse effect mentions (adjusted odds ratio [aOR] 3.42, 95% CI 2.89&#x2010;4.05; <italic>P</italic>&#x003C;.001), posts in medical advice communities (aOR 2.76, 95% CI 2.31&#x2010;3.30; <italic>P</italic>&#x003C;.001), adherence issues (aOR 2.18, 95% CI 1.84&#x2010;2.58; <italic>P</italic>&#x003C;.001), and high clinical relevance content (aOR 1.47, 95% CI 1.18&#x2010;1.84; <italic>P</italic>=.001; <xref ref-type="table" rid="table3">Table 3</xref>).</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Multivariable logistic regression of factors associated with negative sentiment.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Variable</td><td align="left" valign="bottom" colspan="2">Adjusted odds ratio (95% CI)</td><td align="left" valign="bottom"><italic>P</italic> value</td></tr></thead><tbody><tr><td align="left" valign="top">Adverse effect mentions</td><td align="left" valign="top" colspan="2">3.42 (2.89&#x2010;4.05)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Posts in medical advice communities</td><td align="left" valign="top" colspan="2">2.76 (2.31&#x2010;3.30)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Adherence issues</td><td align="left" valign="top" colspan="2">2.18 (1.84&#x2010;2.58)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">High clinical relevance content</td><td align="left" valign="top" colspan="2">1.47 (1.18&#x2010;1.84)</td><td align="left" valign="top">.001</td></tr></tbody></table></table-wrap></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Main Findings</title><p>In this large-scale analysis of statin-related discussions on Reddit, patient discourse was shaped primarily by perceived adverse effects, uncertainty about benefits, and peer validation, with relatively limited reference to formal cardiovascular risk stratification. Although statins are strongly endorsed by clinical guidelines for ASCVD prevention [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref26">26</xref>], real-world patient narratives were frequently framed around experiential and emotional factors, including fear of long-term harm, symptom attribution, and ambivalence toward medical authority. This divergence between guideline-based evidence and patient-centered concerns helps explain persistently suboptimal statin adherence despite decades of robust trial data [<xref ref-type="bibr" rid="ref28">28</xref>].</p><p>Notably, fewer than 1 in 8 discussions met criteria for high clinical relevance based on American Heart Association, American College of Cardiology, and US Preventive Services Task Force risk thresholds [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref26">26</xref>]. Instead, most conversations focused on nonspecific symptoms, laboratory fluctuations, or lifestyle considerations, suggesting that engagement with statin therapy often occurs outside a formal risk-benefit calculus. Therefore, effective statin counseling may require attention to patients&#x2019; beliefs and concerns, beyond clinical risk factors alone.</p></sec><sec id="s4-2"><title>The Adverse Effect Paradox: Perception vs Trial Evidence</title><p>Adverse effect concerns were prominent in our dataset (n=1697, 31.9% of discussions), which is not directly comparable to trial-based incidence estimates but may reflect a perception-evidence gap that shapes beliefs and adherence decisions. Evidence from blinded randomized trials and individual-participant meta-analyses suggests that the excess risk of muscle symptoms attributable to statins is small and that most muscle symptom reports under blinded conditions are not attributable to statin therapy [<xref ref-type="bibr" rid="ref29">29</xref>]. This divergence is consistent with nocebo-related expectation and attribution mechanisms within the broader information environment. In the Anglo-Scandinavian Cardiac Outcomes Trial&#x2013;Lipid-Lowering Arm, muscle-related adverse events were reported more frequently during the unblinded extension than during blinded treatment despite comparable exposure, supporting expectation-driven symptom attribution [<xref ref-type="bibr" rid="ref30">30</xref>].</p><p>Cognitive concerns (eg, &#x201C;brain fog&#x201D;) appeared in 3.6% (n=61) of discussions, although randomized trials have not demonstrated statin-attributable cognitive impairment [<xref ref-type="bibr" rid="ref31">31</xref>]. Regulatory agencies have noted rare, generally reversible postmarketing reports, and the prominence of such concerns online may reflect expectation-driven symptom attribution [<xref ref-type="bibr" rid="ref32">32</xref>]. Mechanistically, true statin myopathy occurs in a subset of patients, including those with <italic>SLCO1B1</italic> variants or drug-drug interactions, but the high salience of adverse effects in online communities likely reflects both heterogeneity in susceptibility and selection effects (symptomatic users preferentially posting) [<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref34">34</xref>]. Clinicians should anticipate that patients initiate statins within an information ecosystem that can magnify harm narratives. Proactive counseling, clear differentiation of evidence-based risks, and structured symptom assessment (eg, Statin-Associated Muscle Symptom Clinical Index) may reduce nocebo-driven discontinuation [<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref36">36</xref>].</p></sec><sec id="s4-3"><title>Emotional Burden as a Hidden Driver of Nonadherence</title><p>Beyond physical symptoms, statin discussions carried substantial emotional content (n=4537, 85.2%), with frustration (n=1705, 32%) and confusion (n=911, 17.1%) predominating. These patterns suggest that statin decisions may be shaped by emotional responses (eg, frustration and anxiety) in addition to objective risk appraisal. Negative emotion is consistently associated with poorer adherence across chronic disease contexts. A meta-analysis by DiMatteo et al [<xref ref-type="bibr" rid="ref37">37</xref>] found markedly higher nonadherence among patients with depression. Similarly, medication-specific emotional distress has been associated with treatment discontinuation, even after accounting for clinical depression [<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref39">39</xref>]. In our dataset, adherence problems (n=1587, 29.8%) frequently co-occurred with adverse effect narratives and negative sentiment, suggesting a pathway in which perceived harms generate distress that undermines persistence. These emotional dimensions may be underelicited in routine care, where time-constrained visits often prioritize biomarker review and dose adjustment. Incorporating a brief assessment of medication-related distress into cardiovascular prevention workflows, paired with motivational interviewing, could identify patients at risk for emotionally driven discontinuation earlier in the treatment course.</p></sec><sec id="s4-4"><title>Community as an Information Filter: The Ecology of Online Health Discourse</title><p>Sentiment and content varied substantially across Reddit communities. Negative sentiment was more prevalent in medical advice&#x2013;seeking subreddits (eg, r/AskDocs: 77.3%) than in lifestyle-focused subreddits (eg, r/Biohackers: 9.1%). Condition-specific forums (eg, r/stroke and r/HeartAttack) contained the highest proportion of clinically relevant content, while dietary communities (eg, r/keto) more often reflected cholesterol skepticism that diverged from guideline framing [<xref ref-type="bibr" rid="ref2">2</xref>].</p><p>These patterns are consistent with community selection as an &#x201C;information filter,&#x201D; in which users preferentially encounter narratives aligned with prevailing community norms and their own concerns; similar dynamics have been described in other online health communities [<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref41">41</xref>]. Such community-specific patterns may reinforce users&#x2019; existing perspectives. For example, dietary forums showed more skepticism toward statins, while condition-specific communities (eg, r/HeartAttack) contained more secondary prevention content. Therefore, community-specific outreach may be more effective than generic education. Strategies could include engaging trusted voices within skeptical forums, tailoring evidence presentation to community values, and directly addressing prevalent misconceptions (eg, &#x201C;cholesterol myth&#x201D; narratives), thereby complementing traditional patient counseling.</p></sec><sec id="s4-5"><title>The Emerging Role of Artificial Intelligence in Patient Decision-Making</title><p>Explicit mentions of LLMs were uncommon (n=23, 0.4%) but increased from 6 in 2023 to 32 in early 2025, suggesting growing uptake. Users described using tools such as ChatGPT to interpret laboratory results, weigh treatment options, and prepare questions for clinical encounters. To the best of our knowledge, few studies have quantified artificial intelligence (AI) tool use within real-world cardiovascular treatment discussions. Prior research has evaluated LLM performance on medical queries [<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref43">43</xref>], but implications for patient expectations and decision-making remain incompletely characterized. These findings raise questions about how AI-mediated information may shape patient perspectives before clinical visits, warranting further investigation and practical guidance for clinicians.</p></sec><sec id="s4-6"><title>Limitations</title><p>This study has several limitations. First, Reddit API retrieval imposes sampling constraints. Search results are not uniformly sampled. Each keyword query is capped (&#x2264;1000 submissions), and ranking algorithms can overrepresent newer posts. This may yield a recency- and visibility-biased corpus. Accordingly, theme and sentiment frequencies should be interpreted as visibility-weighted patterns within the retrieved dataset rather than population-level prevalence for all statin-related content on Reddit; this may inflate high-salience topics (eg, adverse effects, discontinuation, and emotionally charged narratives) and complicate temporal comparisons. Second, Reddit&#x2019;s pseudonymous structure prevents verification of demographics, diagnoses, lipid values, comorbidities, and outcomes. Users are unlikely to be representative of the broader statin-using population, limiting generalizability&#x2014;particularly to older adults and those with lower digital access or health literacy. Third, self-reported social media content is subject to recall bias and selective posting, potentially overrepresenting unusual or negative experiences. Fourth, although we used expert-guided prompt development and validation, LLM-based extraction may misclassify nuanced language (eg, sarcasm or irony) or clinical attribution, which could affect domain-specific estimates. Evidence-quote requirements and human validation mitigate but do not eliminate this risk. Fifth, findings are limited to 1 platform and English-language content; discourse may differ across platforms and languages. Finally, this cross-sectional design cannot establish causality, assess within-person changes, or link discourse to clinical outcomes. Because nondisclosure in social media reflects &#x201C;unreported&#x201D; rather than missing at random, our conservative handling of unreported variables may underestimate clinical relevance and attenuate associations. We mitigate these limitations through transparent reporting, stratified expert validation, and emphasis on associations rather than causal claims. Future work should consider time-stratified sampling, multiplatform triangulation, and linkage to external clinical data (eg, registries, claims, or electronic health record&#x2013;linked cohorts) where feasible.</p></sec><sec id="s4-7"><title>Conclusions</title><p>This study highlights a substantial misalignment between guideline-based statin risk stratification and the lived experiences expressed by patients online. Across 5328 Reddit discussions, discourse centered on perceived adverse effects (n=1697, 31.9%), emotional distress (n=4537, 85.2%), and mentions of &#x201C;natural&#x201D; alternatives (n=2485, 46.6%), patterns that may help explain persistent challenges in long-term adherence. These findings suggest that effective cardiovascular prevention must go beyond information provision to address nocebo effects and treatment-related frustration that shape patients&#x2019; responses to therapy. Methodologically, our validated LLM-enabled pipeline captures nuanced dimensions of treatment experience (eg, ambivalence and peer influence) that are poorly measured by conventional surveillance approaches. As patients increasingly navigate AI-mediated information environments, evidence-informed engagement with digital spaces may support shared decision-making and improve long-term outcomes.</p></sec></sec></body><back><ack><p>During manuscript preparation, the authors used ChatGPT (OpenAI) for language editing to improve clarity and readability. The tool was used only to assist with wording and expression. All artificial intelligence&#x2013;generated suggestions were critically reviewed and revised by the authors, who take full responsibility for the accuracy, integrity, and originality of the final manuscript.</p></ack><notes><sec><title>Funding</title><p>This work was supported by the National Institutes of Health (grant R00LM014097).</p></sec><sec><title>Data Availability</title><p>The datasets generated or analyzed during this study are not publicly available because sharing Reddit-derived data could increase the risk of user traceability and would be inconsistent with the study&#x2019;s privacy protections.</p></sec></notes><fn-group><fn fn-type="con"><p>Conceptualization: SL, JL</p><p>Data curation: SL</p><p>Formal analysis: SL</p><p>Investigation: SL</p><p>Methodology: SL, JL</p><p>Software: SL</p><p>Writing&#x2014;original draft: SL</p><p>Writing&#x2014;review and editing: SL, JL</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AI </term><def><p>artificial intelligence</p></def></def-item><def-item><term id="abb2">aOR</term><def><p>adjusted odds ratio</p></def></def-item><def-item><term id="abb3">API</term><def><p>application programming interface</p></def></def-item><def-item><term id="abb4">ASCVD</term><def><p>atherosclerotic cardiovascular disease</p></def></def-item><def-item><term id="abb5">LLM</term><def><p>large language model</p></def></def-item><def-item><term id="abb6">PRISMA</term><def><p>Preferred Reporting Items for Systematic Reviews and Meta-Analyses</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Collins</surname><given-names>R</given-names> </name><name name-style="western"><surname>Reith</surname><given-names>C</given-names> </name><name name-style="western"><surname>Emberson</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Interpretation of the evidence for the efficacy and safety of statin therapy</article-title><source>Lancet</source><year>2016</year><month>11</month><day>19</day><volume>388</volume><issue>10059</issue><fpage>2532</fpage><lpage>2561</lpage><pub-id pub-id-type="doi">10.1016/S0140-6736(16)31357-5</pub-id><pub-id pub-id-type="medline">27616593</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Grundy</surname><given-names>SM</given-names> </name><name name-style="western"><surname>Stone</surname><given-names>NJ</given-names> </name><name name-style="western"><surname>Bailey</surname><given-names>AL</given-names> </name><etal/></person-group><article-title>2018 AHA/ACC/AACVPR/AAPA/ABC/ACPM/ADA/AGS/APhA/ASPC/NLA/PCNA guideline on the management of blood cholesterol: executive summary: a report of the American College of Cardiology/American Heart Association Task Force on Clinical Practice Guidelines</article-title><source>J Am Coll Cardiol</source><year>2019</year><month>06</month><day>25</day><volume>73</volume><issue>24</issue><fpage>3168</fpage><lpage>3209</lpage><pub-id pub-id-type="doi">10.1016/j.jacc.2018.11.002</pub-id><pub-id pub-id-type="medline">30423391</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Visseren</surname><given-names>FLJ</given-names> </name><name name-style="western"><surname>Mach</surname><given-names>F</given-names> </name><name name-style="western"><surname>Smulders</surname><given-names>YM</given-names> </name><etal/></person-group><article-title>2021 ESC Guidelines on cardiovascular disease prevention in clinical practice</article-title><source>Eur J Prev Cardiol</source><year>2022</year><month>02</month><day>19</day><volume>29</volume><issue>1</issue><fpage>5</fpage><lpage>115</lpage><pub-id pub-id-type="doi">10.1093/eurjpc/zwab154</pub-id><pub-id pub-id-type="medline">34558602</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhang</surname><given-names>H</given-names> </name><name name-style="western"><surname>Plutzky</surname><given-names>J</given-names> </name><name name-style="western"><surname>Skentzos</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Discontinuation of statins in routine care settings: a cohort study</article-title><source>Ann Intern Med</source><year>2013</year><month>04</month><day>2</day><volume>158</volume><issue>7</issue><fpage>526</fpage><lpage>534</lpage><pub-id pub-id-type="doi">10.7326/0003-4819-158-7-201304020-00004</pub-id><pub-id pub-id-type="medline">23546564</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Basios</surname><given-names>A</given-names> </name><name name-style="western"><surname>Markozannes</surname><given-names>G</given-names> </name><name name-style="western"><surname>Ntzani</surname><given-names>EE</given-names> </name><etal/></person-group><article-title>Prevalence and determinants of adherence to statin therapy: a systematic review and meta-analysis</article-title><source>Eur J Prev Cardiol</source><year>2025</year><month>12</month><day>16</day><fpage>zwaf769</fpage><pub-id pub-id-type="doi">10.1093/eurjpc/zwaf769</pub-id><pub-id pub-id-type="medline">41401202</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Vinogradova</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Coupland</surname><given-names>C</given-names> </name><name name-style="western"><surname>Brindle</surname><given-names>P</given-names> </name><name name-style="western"><surname>Hippisley-Cox</surname><given-names>J</given-names> </name></person-group><article-title>Discontinuation and restarting in patients on statin treatment: prospective open cohort study using a primary care database</article-title><source>BMJ</source><year>2016</year><month>06</month><day>28</day><volume>353</volume><fpage>i3305</fpage><pub-id pub-id-type="doi">10.1136/bmj.i3305</pub-id><pub-id pub-id-type="medline">27353261</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Anker</surname><given-names>SD</given-names> </name><name name-style="western"><surname>Agewall</surname><given-names>S</given-names> </name><name name-style="western"><surname>Borggrefe</surname><given-names>M</given-names> </name><etal/></person-group><article-title>The importance of patient-reported outcomes: a call for their comprehensive integration in cardiovascular clinical trials</article-title><source>Eur Heart J</source><year>2014</year><month>08</month><day>7</day><volume>35</volume><issue>30</issue><fpage>2001</fpage><lpage>2009</lpage><pub-id pub-id-type="doi">10.1093/eurheartj/ehu205</pub-id><pub-id pub-id-type="medline">24904027</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Magnani</surname><given-names>JW</given-names> </name><name name-style="western"><surname>Mujahid</surname><given-names>MS</given-names> </name><name name-style="western"><surname>Aronow</surname><given-names>HD</given-names> </name><etal/></person-group><article-title>Health literacy and cardiovascular disease: fundamental relevance to primary and secondary prevention: a scientific statement from the American Heart Association</article-title><source>Circulation</source><year>2018</year><month>07</month><day>10</day><volume>138</volume><issue>2</issue><fpage>e48</fpage><lpage>e74</lpage><pub-id pub-id-type="doi">10.1161/CIR.0000000000000579</pub-id><pub-id pub-id-type="medline">29866648</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Brinton</surname><given-names>EA</given-names> </name></person-group><article-title>Understanding patient adherence and concerns with STatins and MedicatION Discussions With Physicians (ACTION): a survey on the patient perspective of dialogue with healthcare providers regarding statin therapy</article-title><source>Clin Cardiol</source><year>2018</year><month>06</month><volume>41</volume><issue>6</issue><fpage>710</fpage><lpage>720</lpage><pub-id pub-id-type="doi">10.1002/clc.22975</pub-id><pub-id pub-id-type="medline">29749101</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lardon</surname><given-names>J</given-names> </name><name name-style="western"><surname>Abdellaoui</surname><given-names>R</given-names> </name><name name-style="western"><surname>Bellet</surname><given-names>F</given-names> </name><etal/></person-group><article-title>Adverse drug reaction identification and extraction in social media: a scoping review</article-title><source>J Med Internet Res</source><year>2015</year><month>07</month><day>10</day><volume>17</volume><issue>7</issue><fpage>e171</fpage><pub-id pub-id-type="doi">10.2196/jmir.4304</pub-id><pub-id pub-id-type="medline">26163365</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nikfarjam</surname><given-names>A</given-names> </name><name name-style="western"><surname>Sarker</surname><given-names>A</given-names> </name><name name-style="western"><surname>O&#x2019;Connor</surname><given-names>K</given-names> </name><name name-style="western"><surname>Ginn</surname><given-names>R</given-names> </name><name name-style="western"><surname>Gonzalez</surname><given-names>G</given-names> </name></person-group><article-title>Pharmacovigilance from social media: mining adverse drug reaction mentions using sequence labeling with word embedding cluster features</article-title><source>J Am Med Inform Assoc</source><year>2015</year><month>05</month><volume>22</volume><issue>3</issue><fpage>671</fpage><lpage>681</lpage><pub-id pub-id-type="doi">10.1093/jamia/ocu041</pub-id><pub-id pub-id-type="medline">25755127</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Golder</surname><given-names>S</given-names> </name><name name-style="western"><surname>O&#x2019;Connor</surname><given-names>K</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Klein</surname><given-names>A</given-names> </name><name name-style="western"><surname>Gonzalez Hernandez</surname><given-names>G</given-names> </name></person-group><article-title>The value of social media analysis for adverse events detection and pharmacovigilance: scoping review</article-title><source>JMIR Public Health Surveill</source><year>2024</year><month>09</month><day>6</day><volume>10</volume><fpage>e59167</fpage><pub-id pub-id-type="doi">10.2196/59167</pub-id><pub-id pub-id-type="medline">39240684</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Somani</surname><given-names>S</given-names> </name><name name-style="western"><surname>van Buchem</surname><given-names>MM</given-names> </name><name name-style="western"><surname>Sarraju</surname><given-names>A</given-names> </name><name name-style="western"><surname>Hernandez-Boussard</surname><given-names>T</given-names> </name><name name-style="western"><surname>Rodriguez</surname><given-names>F</given-names> </name></person-group><article-title>Artificial intelligence-enabled analysis of statin-related topics and sentiments on social media</article-title><source>JAMA Netw Open</source><year>2023</year><month>04</month><day>3</day><volume>6</volume><issue>4</issue><fpage>e239747</fpage><pub-id pub-id-type="doi">10.1001/jamanetworkopen.2023.9747</pub-id><pub-id pub-id-type="medline">37093597</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="web"><article-title>Press - Reddit</article-title><source>Reddit</source><access-date>2025-05-20</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.redditinc.com/press">https://www.redditinc.com/press</ext-link></comment></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rupert</surname><given-names>DJ</given-names> </name><name name-style="western"><surname>Gard Read</surname><given-names>J</given-names> </name><name name-style="western"><surname>Amoozegar</surname><given-names>JB</given-names> </name><etal/></person-group><article-title>Peer-generated health information: the role of online communities in patient and caregiver health decisions</article-title><source>J Health Commun</source><year>2016</year><month>11</month><volume>21</volume><issue>11</issue><fpage>1187</fpage><lpage>1197</lpage><pub-id pub-id-type="doi">10.1080/10810730.2016.1237592</pub-id><pub-id pub-id-type="medline">27805496</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Golder</surname><given-names>S</given-names> </name><name name-style="western"><surname>O&#x2019;Connor</surname><given-names>K</given-names> </name><name name-style="western"><surname>Hennessy</surname><given-names>S</given-names> </name><name name-style="western"><surname>Gross</surname><given-names>R</given-names> </name><name name-style="western"><surname>Gonzalez-Hernandez</surname><given-names>G</given-names> </name></person-group><article-title>Assessment of beliefs and attitudes about statins posted on Twitter: a qualitative study</article-title><source>JAMA Netw Open</source><year>2020</year><month>06</month><day>1</day><volume>3</volume><issue>6</issue><fpage>e208953</fpage><pub-id pub-id-type="doi">10.1001/jamanetworkopen.2020.8953</pub-id><pub-id pub-id-type="medline">32584408</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Moorhead</surname><given-names>SA</given-names> </name><name name-style="western"><surname>Hazlett</surname><given-names>DE</given-names> </name><name name-style="western"><surname>Harrison</surname><given-names>L</given-names> </name><name name-style="western"><surname>Carroll</surname><given-names>JK</given-names> </name><name name-style="western"><surname>Irwin</surname><given-names>A</given-names> </name><name name-style="western"><surname>Hoving</surname><given-names>C</given-names> </name></person-group><article-title>A new dimension of health care: systematic review of the uses, benefits, and limitations of social media for health communication</article-title><source>J Med Internet Res</source><year>2013</year><month>04</month><day>23</day><volume>15</volume><issue>4</issue><fpage>e85</fpage><pub-id pub-id-type="doi">10.2196/jmir.1933</pub-id><pub-id pub-id-type="medline">23615206</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bedi</surname><given-names>S</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Orr-Ewing</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Testing and evaluation of health care applications of large language models: a systematic review</article-title><source>JAMA</source><year>2025</year><month>01</month><day>28</day><volume>333</volume><issue>4</issue><fpage>319</fpage><lpage>328</lpage><pub-id pub-id-type="doi">10.1001/jama.2024.21700</pub-id><pub-id pub-id-type="medline">39405325</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Goglia</surname><given-names>D</given-names> </name><name name-style="western"><surname>Vega</surname><given-names>D</given-names> </name></person-group><article-title>Structure and dynamics of growing networks of Reddit threads</article-title><source>Appl Netw Sci</source><year>2024</year><volume>9</volume><fpage>48</fpage><pub-id pub-id-type="doi">10.1007/s41109-024-00654-y</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Golder</surname><given-names>S</given-names> </name><name name-style="western"><surname>Ahmed</surname><given-names>S</given-names> </name><name name-style="western"><surname>Norman</surname><given-names>G</given-names> </name><name name-style="western"><surname>Booth</surname><given-names>A</given-names> </name></person-group><article-title>Attitudes toward the ethics of research using social media: a systematic review</article-title><source>J Med Internet Res</source><year>2017</year><month>06</month><day>6</day><volume>19</volume><issue>6</issue><fpage>e195</fpage><pub-id pub-id-type="doi">10.2196/jmir.7082</pub-id><pub-id pub-id-type="medline">28588006</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="web"><article-title>Language identification</article-title><source>FastText</source><access-date>2025-05-20</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://fasttext.cc/docs/en/language-identification.html">https://fasttext.cc/docs/en/language-identification.html</ext-link></comment></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Broder</surname><given-names>AZ</given-names> </name></person-group><article-title>On the resemblance and containment of documents</article-title><conf-name>Compression and Complexity of SEQUENCES 1997</conf-name><conf-date>Jun 13, 1997</conf-date><pub-id pub-id-type="doi">10.1109/SEQUEN.1997.666900</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="web"><article-title>Introducing GPT-4.1 in the API</article-title><source>OpenAI</source><year>2025</year><access-date>2025-04-14</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://openai.com/index/gpt-4-1/">https://openai.com/index/gpt-4-1/</ext-link></comment></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Croskerry</surname><given-names>P</given-names> </name></person-group><article-title>A universal model of diagnostic reasoning</article-title><source>Acad Med</source><year>2009</year><month>08</month><volume>84</volume><issue>8</issue><fpage>1022</fpage><lpage>1028</lpage><pub-id pub-id-type="doi">10.1097/ACM.0b013e3181ace703</pub-id><pub-id pub-id-type="medline">19638766</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Grundy</surname><given-names>SM</given-names> </name><name name-style="western"><surname>Stone</surname><given-names>NJ</given-names> </name><name name-style="western"><surname>Bailey</surname><given-names>AL</given-names> </name><etal/></person-group><article-title>2018 AHA/ACC/AACVPR/AAPA/ABC/ACPM/ADA/AGS/APhA/ASPC/NLA/PCNA guideline on the management of blood cholesterol: a report of the American College of Cardiology/American Heart Association Task Force on Clinical Practice Guidelines</article-title><source>Circulation</source><year>2019</year><month>06</month><day>18</day><volume>139</volume><issue>25</issue><fpage>e1082</fpage><lpage>e1143</lpage><pub-id pub-id-type="doi">10.1161/CIR.0000000000000625</pub-id><pub-id pub-id-type="medline">30586774</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><collab>US Preventive Services Task Force</collab><name name-style="western"><surname>Mangione</surname><given-names>CM</given-names> </name><name name-style="western"><surname>Barry</surname><given-names>MJ</given-names> </name><etal/></person-group><article-title>Statin use for the primary prevention of cardiovascular disease in adults: US Preventive Services Task Force recommendation statement</article-title><source>JAMA</source><year>2022</year><month>08</month><day>23</day><volume>328</volume><issue>8</issue><fpage>746</fpage><lpage>753</lpage><pub-id pub-id-type="doi">10.1001/jama.2022.13044</pub-id><pub-id pub-id-type="medline">35997723</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="report"><person-group person-group-type="author"><name name-style="western"><surname>Franzke</surname><given-names>AS</given-names> </name><name name-style="western"><surname>Bechmann</surname><given-names>A</given-names> </name><name name-style="western"><surname>Zimmer</surname><given-names>M</given-names> </name><name name-style="western"><surname>Ess</surname><given-names>C</given-names> </name></person-group><article-title>Internet research: ethical guidelines 3.0</article-title><source>Association of Internet Researchers</source><year>2020</year><access-date>2026-04-06</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://aoir.org/reports/ethics3.pdf">https://aoir.org/reports/ethics3.pdf</ext-link></comment></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ingersgaard</surname><given-names>MV</given-names> </name><name name-style="western"><surname>Helms Andersen</surname><given-names>T</given-names> </name><name name-style="western"><surname>Norgaard</surname><given-names>O</given-names> </name><name name-style="western"><surname>Grabowski</surname><given-names>D</given-names> </name><name name-style="western"><surname>Olesen</surname><given-names>K</given-names> </name></person-group><article-title>Reasons for nonadherence to statins - a systematic review of reviews</article-title><source>Patient Prefer Adherence</source><year>2020</year><volume>14</volume><fpage>675</fpage><lpage>691</lpage><pub-id pub-id-type="doi">10.2147/PPA.S245365</pub-id><pub-id pub-id-type="medline">32308373</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><collab>Cholesterol Treatment Trialists&#x2019; Collaboration</collab></person-group><article-title>Effect of statin therapy on muscle symptoms: an individual participant data meta-analysis of large-scale, randomised, double-blind trials</article-title><source>Lancet</source><year>2022</year><month>09</month><day>10</day><volume>400</volume><issue>10355</issue><fpage>832</fpage><lpage>845</lpage><pub-id pub-id-type="doi">10.1016/S0140-6736(22)01545-8</pub-id><pub-id pub-id-type="medline">36049498</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gupta</surname><given-names>A</given-names> </name><name name-style="western"><surname>Thompson</surname><given-names>D</given-names> </name><name name-style="western"><surname>Whitehouse</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Adverse events associated with unblinded, but not with blinded, statin therapy in the Anglo-Scandinavian Cardiac Outcomes Trial-Lipid-Lowering Arm (ASCOT-LLA): a randomised double-blind placebo-controlled trial and its non-randomised non-blind extension phase</article-title><source>Lancet</source><year>2017</year><month>06</month><day>24</day><volume>389</volume><issue>10088</issue><fpage>2473</fpage><lpage>2481</lpage><pub-id pub-id-type="doi">10.1016/S0140-6736(17)31075-9</pub-id><pub-id pub-id-type="medline">28476288</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhou</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Ryan</surname><given-names>J</given-names> </name><name name-style="western"><surname>Ernst</surname><given-names>ME</given-names> </name><etal/></person-group><article-title>Effect of statin therapy on cognitive decline and incident dementia in older adults</article-title><source>J Am Coll Cardiol</source><year>2021</year><month>06</month><day>29</day><volume>77</volume><issue>25</issue><fpage>3145</fpage><lpage>3156</lpage><pub-id pub-id-type="doi">10.1016/j.jacc.2021.04.075</pub-id><pub-id pub-id-type="medline">34167639</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="web"><article-title>Cholesterol-lowering drugs get labeling changes</article-title><source>U.S. Food and Drug Administration</source><year>2015</year><access-date>2025-11-10</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.fda.gov/drugs/special-features/cholesterol-lowering-drugs-get-labeling-changes">https://www.fda.gov/drugs/special-features/cholesterol-lowering-drugs-get-labeling-changes</ext-link></comment></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cooper-DeHoff</surname><given-names>RM</given-names> </name><name name-style="western"><surname>Niemi</surname><given-names>M</given-names> </name><name name-style="western"><surname>Ramsey</surname><given-names>LB</given-names> </name><etal/></person-group><article-title>The Clinical Pharmacogenetics Implementation Consortium Guideline for SLCO1B1, ABCG2, and CYP2C9 genotypes and statin-associated musculoskeletal symptoms</article-title><source>Clin Pharmacol Ther</source><year>2022</year><month>05</month><volume>111</volume><issue>5</issue><fpage>1007</fpage><lpage>1021</lpage><pub-id pub-id-type="doi">10.1002/cpt.2557</pub-id><pub-id pub-id-type="medline">35152405</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><collab>SEARCH Collaborative Group</collab><name name-style="western"><surname>Link</surname><given-names>E</given-names> </name><name name-style="western"><surname>Parish</surname><given-names>S</given-names> </name><etal/></person-group><article-title>SLCO1B1 variants and statin-induced myopathy--a genomewide study</article-title><source>N Engl J Med</source><year>2008</year><month>08</month><day>21</day><volume>359</volume><issue>8</issue><fpage>789</fpage><lpage>799</lpage><pub-id pub-id-type="doi">10.1056/NEJMoa0801936</pub-id><pub-id pub-id-type="medline">18650507</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Howard</surname><given-names>JP</given-names> </name><name name-style="western"><surname>Wood</surname><given-names>FA</given-names> </name><name name-style="western"><surname>Finegold</surname><given-names>JA</given-names> </name><etal/></person-group><article-title>Side effect patterns in a crossover trial of statin, placebo, and no treatment</article-title><source>J Am Coll Cardiol</source><year>2021</year><month>09</month><day>21</day><volume>78</volume><issue>12</issue><fpage>1210</fpage><lpage>1222</lpage><pub-id pub-id-type="doi">10.1016/j.jacc.2021.07.022</pub-id><pub-id pub-id-type="medline">34531021</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rosenson</surname><given-names>RS</given-names> </name><name name-style="western"><surname>Miller</surname><given-names>K</given-names> </name><name name-style="western"><surname>Bayliss</surname><given-names>M</given-names> </name><etal/></person-group><article-title>The Statin-Associated Muscle Symptom Clinical Index (SAMS-CI): revision for clinical use, content validation, and inter-rater reliability</article-title><source>Cardiovasc Drugs Ther</source><year>2017</year><month>04</month><volume>31</volume><issue>2</issue><fpage>179</fpage><lpage>186</lpage><pub-id pub-id-type="doi">10.1007/s10557-017-6723-4</pub-id><pub-id pub-id-type="medline">28421332</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>DiMatteo</surname><given-names>MR</given-names> </name><name name-style="western"><surname>Lepper</surname><given-names>HS</given-names> </name><name name-style="western"><surname>Croghan</surname><given-names>TW</given-names> </name></person-group><article-title>Depression is a risk factor for noncompliance with medical treatment: meta-analysis of the effects of anxiety and depression on patient adherence</article-title><source>Arch Intern Med</source><year>2000</year><month>07</month><day>24</day><volume>160</volume><issue>14</issue><fpage>2101</fpage><lpage>2107</lpage><pub-id pub-id-type="doi">10.1001/archinte.160.14.2101</pub-id><pub-id pub-id-type="medline">10904452</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hoogendoorn</surname><given-names>CJ</given-names> </name><name name-style="western"><surname>Krause-Steinrauf</surname><given-names>H</given-names> </name><name name-style="western"><surname>Uschner</surname><given-names>D</given-names> </name><etal/></person-group><article-title>Emotional distress predicts reduced type 2 diabetes treatment adherence in the Glycemia Reduction Approaches in Diabetes: a comparative effectiveness study (GRADE)</article-title><source>Diabetes Care</source><year>2024</year><month>04</month><day>1</day><volume>47</volume><issue>4</issue><fpage>629</fpage><lpage>637</lpage><pub-id pub-id-type="doi">10.2337/dc23-1401</pub-id><pub-id pub-id-type="medline">38227900</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gonzalez</surname><given-names>JS</given-names> </name><name name-style="western"><surname>Shreck</surname><given-names>E</given-names> </name><name name-style="western"><surname>Psaros</surname><given-names>C</given-names> </name><name name-style="western"><surname>Safren</surname><given-names>SA</given-names> </name></person-group><article-title>Distress and type 2 diabetes-treatment adherence: a mediating role for perceived control</article-title><source>Health Psychol</source><year>2015</year><month>05</month><volume>34</volume><issue>5</issue><fpage>505</fpage><lpage>513</lpage><pub-id pub-id-type="doi">10.1037/hea0000131</pub-id><pub-id pub-id-type="medline">25110840</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chou</surname><given-names>WYS</given-names> </name><name name-style="western"><surname>Oh</surname><given-names>A</given-names> </name><name name-style="western"><surname>Klein</surname><given-names>WMP</given-names> </name></person-group><article-title>Addressing health-related misinformation on social media</article-title><source>JAMA</source><year>2018</year><month>12</month><day>18</day><volume>320</volume><issue>23</issue><fpage>2417</fpage><lpage>2418</lpage><pub-id pub-id-type="doi">10.1001/jama.2018.16865</pub-id><pub-id pub-id-type="medline">30428002</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bode</surname><given-names>L</given-names> </name><name name-style="western"><surname>Vraga</surname><given-names>EK</given-names> </name></person-group><article-title>See something, say something: correction of global health misinformation on social media</article-title><source>Health Commun</source><year>2018</year><month>09</month><volume>33</volume><issue>9</issue><fpage>1131</fpage><lpage>1140</lpage><pub-id pub-id-type="doi">10.1080/10410236.2017.1331312</pub-id><pub-id pub-id-type="medline">28622038</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wei</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Yao</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Cui</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Wei</surname><given-names>B</given-names> </name><name name-style="western"><surname>Jin</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Xu</surname><given-names>X</given-names> </name></person-group><article-title>Evaluation of ChatGPT-generated medical responses: a systematic review and meta-analysis</article-title><source>J Biomed Inform</source><year>2024</year><month>03</month><volume>151</volume><fpage>104620</fpage><pub-id pub-id-type="doi">10.1016/j.jbi.2024.104620</pub-id><pub-id pub-id-type="medline">38462064</pub-id></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>M</given-names> </name><name name-style="western"><surname>Okuhara</surname><given-names>T</given-names> </name><name name-style="western"><surname>Chang</surname><given-names>X</given-names> </name><etal/></person-group><article-title>Performance of ChatGPT across different versions in medical licensing examinations worldwide: systematic review and meta-analysis</article-title><source>J Med Internet Res</source><year>2024</year><month>07</month><day>25</day><volume>26</volume><fpage>e60807</fpage><pub-id pub-id-type="doi">10.2196/60807</pub-id><pub-id pub-id-type="medline">39052324</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Data cleaning and filtering.</p><media xlink:href="jmir_v28i1e85057_app1.docx" xlink:title="DOCX File, 18 KB"/></supplementary-material><supplementary-material id="app2"><label>Multimedia Appendix 2</label><p>Large language model&#x2013;based extraction protocol and prompt.</p><media xlink:href="jmir_v28i1e85057_app2.docx" xlink:title="DOCX File, 26 KB"/></supplementary-material><supplementary-material id="app3"><label>Multimedia Appendix 3</label><p>Expert validation protocol.</p><media xlink:href="jmir_v28i1e85057_app3.docx" xlink:title="DOCX File, 32 KB"/></supplementary-material><supplementary-material id="app4"><label>Multimedia Appendix 4</label><p>Example posts with large language model&#x2013;derived theme and sentiment classifications.</p><media xlink:href="jmir_v28i1e85057_app4.docx" xlink:title="DOCX File, 17 KB"/></supplementary-material><supplementary-material id="app5"><label>Multimedia Appendix 5</label><p>Frequency of specific adverse effects mentioned in Reddit discussions on statin therapy.</p><media xlink:href="jmir_v28i1e85057_app5.docx" xlink:title="DOCX File, 20 KB"/></supplementary-material></app-group></back></article>