<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id><journal-id journal-id-type="publisher-id">jmir</journal-id><journal-id journal-id-type="index">1</journal-id><journal-title>Journal of Medical Internet Research</journal-title><abbrev-journal-title>J Med Internet Res</abbrev-journal-title><issn pub-type="epub">1438-8871</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v27i1e79454</article-id><article-id pub-id-type="doi">10.2196/79454</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Intersection of Big Five Personality Traits and Substance Use on Social Media Discourse: AI-Powered Observational Study</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Maharjan</surname><given-names>Julina</given-names></name><degrees>BE, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Jin</surname><given-names>Ruoming</given-names></name><degrees>Prof Dr</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Zhu</surname><given-names>Jianfeng</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Kenne</surname><given-names>Deric</given-names></name><degrees>Prof Dr</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib></contrib-group><aff id="aff1"><institution>Department of Computer Science, Kent State University</institution><addr-line>800 East Summit Street</addr-line><addr-line>Kent</addr-line><addr-line>OH</addr-line><country>United States</country></aff><aff id="aff2"><institution>Department of Public Health, Kent State University</institution><addr-line>Kent</addr-line><addr-line>OH</addr-line><country>United States</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Mavragani</surname><given-names>Amaryllis</given-names></name></contrib><contrib contrib-type="editor"><name name-style="western"><surname>Brini</surname><given-names>Stefano</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Adepoju</surname><given-names>Adewumi</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Mourelatos</surname><given-names>Evangelos</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Roos</surname><given-names>John Magnus</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Anukam</surname><given-names>Stella</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Julina Maharjan, BE, PhD, Department of Computer Science, Kent State University, 800 East Summit Street, Kent, OH, 44242, United States, 1 3305931365; <email>jmaharja@kent.edu</email></corresp></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>19</day><month>12</month><year>2025</year></pub-date><volume>27</volume><elocation-id>e79454</elocation-id><history><date date-type="received"><day>21</day><month>06</month><year>2025</year></date><date date-type="rev-recd"><day>15</day><month>10</month><year>2025</year></date><date date-type="accepted"><day>16</day><month>10</month><year>2025</year></date></history><copyright-statement>&#x00A9; Julina Maharjan, Ruoming Jin, Jianfeng Zhu, Deric Kenne. Originally published in the Journal of Medical Internet Research (<ext-link ext-link-type="uri" xlink:href="https://www.jmir.org">https://www.jmir.org</ext-link>), 19.12.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research (ISSN 1438-8871), is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://www.jmir.org/">https://www.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://www.jmir.org/2025/1/e79454"/><abstract><sec><title>Background</title><p>Personality traits are known predictors of substance use (SU), but their expression and association with SU in digital discourse remain largely unexamined. During the COVID-19 pandemic, the online social engagement heightened and led to an amplification in SU rates, thereby creating a unique natural opportunity to investigate these dynamics through large-scale digital discourse data. In our study, we offer insights beyond traditional self-report methods, which are crucial for developing timely and targeted public health interventions.</p></sec><sec><title>Objective</title><p>We aim to evaluate whether the associations between the Big Five personality traits and SU discourse shifted during the 2019&#x2010;2021 period, and to conduct a focused analysis of how these traits predict SU and relate to specific substance types, emotional expression, and demographic factors.</p></sec><sec sec-type="methods"><title>Methods</title><p>We analyzed a corpus of several hundred million public posts from a major social media platform from 2019 to 2021. Using a pipeline of natural language processing and deep learning models, we identified SU-related posts and subsequently extracted scores for the Big Five personality traits, emotions, and user demographics. We used trend analysis to compare annual shifts in trait-SU associations, while detailed 2020 data underwent rigorous modeling using logistic regression, correlation analysis, and topic modeling to elucidate the core relationships.</p></sec><sec sec-type="results"><title>Results</title><p>Our analysis revealed that Extraversion (odds ratio [OR] 3.22, 95% CI 2.98-3.49) and, most strikingly, agreeableness (OR 4.04, 95% CI 3.71-4.41) were the strongest positive predictors of being a substance user. In stark contrast to the conventional self-medication hypothesis, neuroticism emerged as a robust protective factor against SU (OR 0.29, 95% CI 0.26-0.31). This counterintuitive finding was supported by a decreased association between neuroticism and SU posts at the pandemic&#x2019;s onset in 2020 (Cohen <italic>d</italic>=&#x2212;0.13, 95% CI) and a negative correlation with the expression of negative emotions online. Topic modeling further indicated that SU discourse was frequently embedded in social contexts (social drinking and friendly beverage choices) rather than themes of solitary coping.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>Our findings challenge traditional models by demonstrating that in large-scale online discourse, SU expression is more powerfully linked to social-affiliative traits than to negative emotionality. The paradoxical protective role of neuroticism suggests that established risk profiles may not apply uniformly to digital environments, particularly during a public health crisis. These insights are vital for refining computational methods for public health surveillance and developing interventions that recognize the potent social drivers of SU in the digital age.</p></sec></abstract><kwd-group><kwd>agreeableness</kwd><kwd>extraversion</kwd><kwd>neuroticism</kwd><kwd>openness</kwd><kwd>conscientiousness</kwd><kwd>Big Five personality traits</kwd><kwd>substance use</kwd><kwd>natural language processing</kwd><kwd>NLP</kwd><kwd>deep learning</kwd><kwd>social media</kwd><kwd>X</kwd><kwd>COVID-19</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><sec id="s1-1"><title>Background</title><p>Personality traits are established predictors of substance use (SU), shaping both vulnerability to and protection from risky behaviors [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. The Five-Factor Model of personality, which defines personality through the core dimensions of openness, conscientiousness, extraversion, agreeableness, and neuroticism, provides a robust framework for this purpose [<xref ref-type="bibr" rid="ref3">3</xref>]. The brief description that characterizes each trait, along with the dimension intended to measure, is highlighted in <xref ref-type="other" rid="box1">Textbox 1</xref>.</p><p>For decades, a rich body of research has established foundational links between these personality traits and risky health behaviors, including smoking, excessive alcohol consumption, and poor dietary choices, with high neuroticism and low conscientiousness consistently emerging as key vulnerability factors [<xref ref-type="bibr" rid="ref4">4</xref>]. Within this broader behavioral landscape, these traits also shape vulnerability to SU, influencing both initiation and maintenance of risky consumption patterns [<xref ref-type="bibr" rid="ref5">5</xref>-<xref ref-type="bibr" rid="ref8">8</xref>]. The association between personality and SU is not monolithic; specific traits consistently emerge as powerful risk or protective factors. High neuroticism, the predisposition to negative emotions, is a robust predictor of SU, as individuals may turn to substances to self-medicate or manage pervasive anxiety [<xref ref-type="bibr" rid="ref6">6</xref>]. Conversely, high conscientiousness, characterized by prudence and self-discipline, is a significant protective factor against the impulsivity inherent in substance misuse [<xref ref-type="bibr" rid="ref8">8</xref>]. The roles of other traits are more nuanced: the reward-seeking facets of extraversion can increase initiation in social settings, the curiosity of openness can drive experimentation, and the antagonism of low agreeableness can foster risk through nonconformity [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref9">9</xref>].</p><boxed-text id="box1"><title> . Overview of Big Five personality traits.</title><p>Openness: represents an individual&#x2019;s level of curiosity, imagination, and willingness to try new things.</p><p>Conscientiousness: reflects how organized, responsible, and detail-oriented an individual is.</p><p>Extraversion: indicates how outgoing, sociable, and energetic an individual is.</p><p>Agreeableness: measures how cooperative, trusting, and kind an individual is.</p><p>Neuroticism: represents the level of emotional instability, anxiety, and mood swings an individual experiences.</p></boxed-text><p>At the same time, personality expression on social media is shaped by norms of digital self-presentation and impression management. Individuals often adapt their communication to maintain a favorable or socially desirable image in public online spaces. This framing is particularly relevant for traits such as agreeableness, which may manifest as affiliative, communal, or prosocial discourse even when discussing behaviors such as drinking or drug use. Thus, the personality-SU link on social media may reflect not only underlying psychological dispositions but also the performative dimensions of digital interaction.</p><p>Against this backdrop, major societal disruptions provide unique opportunities to observe how established trait-behavior relationships may shift under conditions of collective stress. The COVID-19 pandemic represents one such exogenous shock: while no longer the central motivation of this study, it created an unparalleled context in which SU behaviors and digital expression were amplified [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref11">11</xref>]. The pandemic functioned as a natural experiment for several reasons. First, it imposed sudden, widespread changes to daily routines, social interaction, and stress levels across diverse populations, creating variation in environmental conditions that could influence SU behaviors. Second, it triggered a simultaneous increase in online social engagement, producing rich, time-stamped digital traces that allowed for the observation of behavior in near real time. Third, because the event was unplanned and affected populations broadly, it reduced potential confounding from self-selection into specific contexts, providing a rare opportunity to examine how personality traits interact with situational stressors to shape SU discourse. Enforced isolation, for example, may have transformed extraversion from a facilitator of recreational use into a risk factor for coping with loneliness [<xref ref-type="bibr" rid="ref11">11</xref>]. Situations of this magnitude challenge traditional research methodologies, as controlled experiments or surveys often lack ecological validity to capture authentic behavioral expressions under rapidly shifting societal conditions [<xref ref-type="bibr" rid="ref12">12</xref>-<xref ref-type="bibr" rid="ref14">14</xref>].</p><p>This methodological gap is particularly salient given the surge in digital communication during the pandemic. Platforms such as Twitter (subsequently rebranded X; X Corp) became central arenas for processing the crisis, creating rich new sources of naturalistic behavioral data. This development has coincided with advances in computational social science, which enable the assessment of psychological states, including personality, through the analysis of natural language at a scale and temporal precision previously unimaginable [<xref ref-type="bibr" rid="ref15">15</xref>]. These digital phenotyping approaches capture authentic linguistic markers of personality in real-world contexts, offering an unprecedented opportunity to examine how the relationship between dispositional traits and SU discourse was reshaped by the pandemic.</p></sec><sec id="s1-2"><title>Literature Review</title><sec id="s1-2-1"><title>Big Five Personality Traits and Their Relationship With SU</title><p>A robust consensus exists regarding the general relationship between the Big Five personality dimensions and SU [<xref ref-type="bibr" rid="ref2">2</xref>]. A &#x201C;problem-behavior&#x201D; profile consistently emerges from meta-analyses and large-scale studies, centrally featuring high neuroticism and low conscientiousness. Neuroticism, the tendency to experience negative emotions such as anxiety and depression, is a powerful predictor of both SU initiation and the development of substance use disorders (SUDs). The prevailing self-medication hypothesis posits that individuals high in this trait turn to substances to cope with or temporarily alleviate their emotional distress [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref16">16</xref>]. Complementing this, low conscientiousness, characterized by impulsivity, poor planning, and a deficit in self-discipline, is strongly linked to a general propensity for risky health behaviors, including the misuse of a wide range of substances [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref17">17</xref>].</p><p>The roles of the other major traits are more nuanced. High extraversion, particularly its facet of sensation-seeking, is often associated with the initiation of recreational SU in social contexts, driven by a desire for stimulation and positive affect. Openness to experience, which reflects intellectual curiosity and a preference for novelty, is frequently linked to experimentation with drugs, especially cannabis and hallucinogens. Finally, low agreeableness, which involves antagonism and nonconformity, can increase SU risk through pathways of social deviance and a disregard for prohibitive social norms [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref18">18</xref>].</p></sec><sec id="s1-2-2"><title>Specificity in Trait-Drug Relationships</title><p>Beyond a general vulnerability, research increasingly reveals that specific traits predispose individuals to use particular classes of drugs, aligning with distinct motivational pathways. For instance, the strong link between neuroticism and SU is most pronounced for depressants such as alcohol and opioids, which are perceived to dampen anxiety and align with a negative reinforcement or &#x201C;coping&#x201D; model of use [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref20">20</xref>]. In contrast, extraversion is more directly predictive of stimulant use such as cocaine and amphetamines, which enhances social energy and reward, reflecting a positive reinforcement pathway [<xref ref-type="bibr" rid="ref21">21</xref>]. The established connection between openness and the use of cannabis and psychedelics is often driven by motives related to cognitive and perceptual expansion rather than social facilitation or distress-coping [<xref ref-type="bibr" rid="ref15">15</xref>]. This evidence suggests that personality does not merely predict if someone will use substances, but often what they will use and why.</p></sec><sec id="s1-2-3"><title>The Moderating Role of Demographics: Age and Gender</title><p>The strength and expression of these personality-SU relationships are further moderated by key demographic factors. Age is a critical variable, as the influence of certain traits evolves across the lifespan. The impact of impulsivity and sensation-seeking (linked to low conscientiousness and high extraversion) is most powerful during adolescence and young adulthood in predicting the initiation of SU [<xref ref-type="bibr" rid="ref22">22</xref>]. In later adulthood, however, traits such as neuroticism may become more salient predictors of the maintenance or escalation of SU as a chronic coping strategy for life stressors [<xref ref-type="bibr" rid="ref8">8</xref>].</p><p>Gender also shapes these pathways [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>]. While men have historically shown higher rates of SUDs, women often exhibit a &#x201C;telescoping&#x201D; effect&#x2014;a more rapid progression from initial use to dependence. Research suggests the link between neuroticism and coping-motivated SU is particularly strong in women, who may be more likely to use substances to self-medicate for co-occurring mood or anxiety disorders. Conversely, SU pathways related to impulsivity and social deviance (low conscientiousness and low agreeableness) appear to be more pronounced predictors for men [<xref ref-type="bibr" rid="ref12">12</xref>].</p></sec><sec id="s1-2-4"><title>Personality Assessment in the Digital Era: Social Media, Personality, and SU</title><p>Despite these well-documented associations, traditional trait-SU research has been constrained by its reliance on self-report surveys and controlled experiments. These methods, while valuable, often suffer from recall bias, social desirability effects, and a lack of ecological validity, failing to capture authentic behavioral expressions in real-world contexts. The proliferation of social media has created an unprecedented opportunity to overcome these limitations [<xref ref-type="bibr" rid="ref25">25</xref>]. Platforms such as Twitter serve as vast, naturalistic archives of human thought and behavior where individuals openly discuss their experiences, including SU.</p><p>The emerging field of digital phenotyping leverages computational methods, particularly natural language processing (NLP), to infer psychological traits and monitor health behaviors from user-generated digital footprints [<xref ref-type="bibr" rid="ref26">26</xref>]. Recent studies have successfully demonstrated the power of these approaches in capturing nuanced behavioral and personality patterns: AI-based analysis of social media language can predict SY treatment outcomes [<xref ref-type="bibr" rid="ref27">27</xref>], while cognition-aware digital phenotyping frameworks provide fine-grained monitoring of SU behaviors in real-time [<xref ref-type="bibr" rid="ref28">28</xref>]. Moreover, digital phenotyping is increasingly recognized as a transformative tool in psychiatry, offering data-driven insights into mental health, including SU risk, and facilitating ecologically valid assessments of personality-SU interactions [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref29">29</xref>].</p><p>This methodology allows researchers to study the personality-SU link at a massive scale, with temporal precision, and within the authentic context of users&#x2019; daily lives, providing a powerful complement to traditional approaches. However, the application of these methods to examine how a global stressor such as the COVID-19 pandemic reshaped the public discourse around personality and SU remains a significant and underexplored frontier.</p><p>This study addresses these research gaps by applying advanced computational methods to a massive longitudinal dataset of 1.13 billion tweets spanning the prepandemic and pandemic periods (2019&#x2010;2021). By leveraging deep learning-based personality inference and state-of-the-art topic and emotion modeling, we provide a multidimensional examination of how personality traits manifested in natural SU discourse. Our study aims to make 3 primary contributions: first, to establish the utility of large-scale social media data for studying personality-SU relationships in ecologically valid contexts; second, to reveal how the crisis conditions of the COVID-19 pandemic modified these associations; and third, to demonstrate the value of computational methods for identifying at-risk populations and informing targeted public health interventions. To achieve these aims, this study is guided by the following research questions (RQs) in <xref ref-type="other" rid="box2">Textbox 2</xref>.</p><boxed-text id="box2"><title> . Research questions (RQ).</title><p>RQ1: longitudinal variation: did the linguistic expression of Big Five personality traits within substance use (SU)-related discourse on Twitter (subsequently rebranded X; X Corp) exhibit significant variation between the prepandemic (2019) and pandemic (2020-2021) periods?</p><p>RQ2: predictive analysis: to what extent do the Big Five personality traits predict SU classification among individuals on the platform Twitter during the unique socioenvironmental context of the COVID-19 pandemic?</p><p>RQ3: emotional expression: how did the emotional tone of SU-related discourse vary across individuals with different dominant personality traits throughout the pandemic?</p><p>RQ4: substance specificity: what were the associations between inferred personality traits and discourse related to specific substance types (eg, alcohol, cannabis, or opioids)?</p><p>RQ5: demographic dimensions: how did the relationships between personality and SU discourse differ across key demographic factors, specifically age and gender?</p><p>RQ6: thematic content: what were the prevailing topics within SU discourse, and how did these themes differ across the 5 major personality traits during the pandemic?</p></boxed-text></sec></sec></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Overview</title><p>The methodology for this study is systematically organized into 4 stages, as depicted in <xref ref-type="fig" rid="figure1">Figure 1</xref>. This section details each stage, beginning with the construction of the SU data corpus (step 1), followed by the parallel extraction of demographic or emotional attributes (step 2) and personality traits (step 3). These streams converge into the final stage, a comprehensive statistical analysis (step 4), designed to address the study&#x2019;s RQs. The reporting of this observational study adhered to the STROBE (Strengthening the Reporting of Observational Studies in Epidemiology) guidelines [<xref ref-type="bibr" rid="ref30">30</xref>], and a completed STROBE checklist detailing the study design and methods is provided in <xref ref-type="supplementary-material" rid="app1">Checklist 1</xref>.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Overview of research work. SU: substance use.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v27i1e79454_fig01.png"/></fig></sec><sec id="s2-2"><title>Data Acquisition and SU Identification (Step 1)</title><p>The foundation of this study is a large-scale data corpus constructed from the Internet Archive&#x2019;s public Twitter stream [<xref ref-type="bibr" rid="ref31">31</xref>], spanning January 1, 2019, to December 31, 2021. This 3-year period provides a critical prepandemic baseline (2019) for comparison against the pandemic&#x2019;s subsequent phases (2020&#x2010;2021).</p><p>The process began with data collection and extensive data preprocessing. We filtered the raw data to retain US-based, original posts (excluding retweets), tweets shorter than 5 words, and applied a rigorous cleaning pipeline using the Natural Language Toolkit. This involved converting text to lowercase, removing punctuation, stop words, URLs, and user mentions, and performing lemmatization to standardize words to their base forms (eg, &#x201C;drinking&#x201D; to &#x201C;drink&#x201D;).</p><p>The cleaned corpus of 1.13 billion posts was then processed for SU identification. We used a deep learning classifier from our prior work [<xref ref-type="bibr" rid="ref32">32</xref>], which uses a RoBERTa [<xref ref-type="bibr" rid="ref32">32</xref>] architecture to identify SU-related discourse with 80% accuracy. This step yielded the final SU data corpus of approximately 9 million posts. As the final part of this stage, we further classified these posts into 10 substance types based on the National Institute on Drug Abuse&#x2019;s pharmacological categories [<xref ref-type="bibr" rid="ref33">33</xref>] (alcohol, tobacco, cannabinoids, stimulants, opioids, hallucinogens, club drugs, dissociative drugs, other compounds, and prescription medication) using standard keywords formulated by National Institute on Drug Abuse. For instance, the post is identified as tobacco only if keywords associated with either one of cigarettes, vapor cigarettes, cigars, chewing tobacco, and snuff are present in the post. These subcategories of classification ensured the foundational data for all subsequent analyses.</p></sec><sec id="s2-3"><title>Demographic and Emotional Feature Extraction (Step 2)</title><p>Taking the 9 million post SU data corpus as input, this stage focused on extracting user-level demographic and post level emotional attributes [<xref ref-type="bibr" rid="ref34">34</xref>].</p></sec><sec id="s2-4"><title>Demographic Extraction</title><p>We inferred user age and gender using the M3-Inference model [<xref ref-type="bibr" rid="ref35">35</xref>], an open-source system that analyzes textual features from user profiles (username, screen name, and description). As validated against ground-truth profiles, the model achieved high accuracy for the gender (95%) and age (89%) classification. Age was categorized into 4 groups (&#x2264;18, 19&#x2010;29, 30&#x2010;39, and &#x2265;40 years).</p></sec><sec id="s2-5"><title>Emotion and Sentiment Extraction</title><p>We analyzed the emotional content of each post using 2 tools. Multi-label emotion recognition was performed using SpanEmo [<xref ref-type="bibr" rid="ref36">36</xref>], a BERT-based model that classifies text into 1 of 7 key emotions (fear, joy, negative, positive, sadness, surprise, and trust). For overall sentiment, we used VADER [<xref ref-type="bibr" rid="ref37">37</xref>], a lexicon-based tool that calculates a single compound score ranging from &#x2212;1 (most negative) to +1 (most positive).</p></sec><sec id="s2-6"><title>Big Five Personality Traits Identification (Step 3)</title><p>We derived users&#x2019; Big Five personality traits (openness, conscientiousness, extraversion, agreeableness, and neuroticism) from their social media posts using our validated deep learning model [<xref ref-type="bibr" rid="ref38">38</xref>]. The model was trained on a Reddit dataset, PANDORA [<xref ref-type="bibr" rid="ref39">39</xref>] comprising 1 million posts with professionally labeled Big Five personality scores. Our architecture used large language model embeddings (RoBERTa [<xref ref-type="bibr" rid="ref40">40</xref>]) trained on a bidirectional long short-term memory network to build the personality trait classifier. Essentially, we build 5 classifiers for each trait in which we achieved an average of area under the receiver operating characteristic curve=0.8 across all traits. The performance of the classifier on each trait was 0.82 for openness, 0.81 for conscientiousness, 0.80 for extraversion, 0.83 for agreeableness, and 0.81 for neuroticism. Using an 8:1:1 data split for training, validation, and testing, the model achieved robust performance in personality trait prediction. As both training and application data consisted of social media content (Reddit and Twitter, respectively), we applied this model to estimate personality scores (range: 0&#x2010;1) for all SU-related posts in our dataset. This approach allowed for scalable personality assessment while maintaining consistency with established psychological measurement frameworks.</p></sec><sec id="s2-7"><title>Comprehensive Analysis (Step 4)</title><sec id="s2-7-1"><title>Trend Analysis</title><p>To explore temporal patterns in personality traits in SU discourse, we conducted a trend analysis examining the mean and SD of the continuous personality score (0 to 1) over the 3 years. The trend was further stratified by the age and gender variables.</p></sec><sec id="s2-7-2"><title>Multilevel Logistic Regression</title><p>To examine temporal trends in the associations between Big Five personality traits and substance-related posts, we conducted logistic regression on the 2020 corpus. Standardized trait scores (mean 0, SD 1) were used as predictors, with substance types (binary: 0/1) as the outcome. Odds ratios (ORs) and 95% CIs were computed to quantify the strength and uncertainty of these associations. To visualize relational patterns, we plotted ORs with connecting lines, enabling clear comparison between multiple substances for a specific trait. Error bars represent 95% CIs, and a reference line at OR 1 indicates no effect. This approach allows for robust assessment of trait-specific substance patterns in social media discourse.</p></sec><sec id="s2-7-3"><title>Biserial Correlation Analysis</title><p>The point-biserial correlation [<xref ref-type="bibr" rid="ref41">41</xref>] is a special case of Pearson correlation used when 1 variable is dichotomous, and the other is continuous. It measures the relationship between a dichotomous (binary) variable and a continuous variable. In our study, we used it to determine the correlation between binary-valued substance type and a continuous Big Five personality score.</p></sec><sec id="s2-7-4"><title>BERTopic Modeling</title><p>We implemented BERTopic [<xref ref-type="bibr" rid="ref42">42</xref>] modeling to analyze SU discourse patterns across different personality traits, using a multistage pipeline that combined transformer-based embeddings with hierarchical clustering. The text was first encoded into 384-dimensional semantic vectors using SentenceTransformer&#x2019;s &#x201C;all-MiniLM-L6-v2&#x201D; model, followed by UMAP (Uniform Manifold Approximation and Projection) dimensionality reduction (n_components=3, cosine metric) and HDBSCAN (Hierarchical Density-Based Spatial Clustering of Applications With Noise) clustering (min_cluster_size=50) to identify distinct topics. For topic representation, we used a hybrid approach incorporating KeyBERT for keyword extraction, Maximal Marginal Relevance (diversity=0.3) for term selection, and GPT-3.5 turbo for generating personality-specific topic labels through customized prompts. The custom prompt is presented in <xref ref-type="other" rid="box3">Textbox 3</xref>. While traditional topic models can identify clusters of semantically related words, their labels are often limited, ambiguous, or fail to capture subtle contextual nuances. GPT, in contrast, leverages deep contextual understanding to generate highly interpretable, human-readable, and personality-sensitive topic descriptors. This allows the model to capture the social, emotional, and behavioral subtleties embedded in SU discourse, providing richer and more actionable insights than conventional labeling methods.</p><boxed-text id="box3"><title> . Large language model prompt for topic labeling.</title><p>Prompt = """I have topic that contains the following documents: \n[DOCUMENTS]The topic is described by the following keywords: [KEYWORDS]Based on the above information, can you give a short label of the topic?"""</p></boxed-text><p>The model incorporated n-gram processing (1&#x2010;2 g) and filtered social media-specific stopwords while leveraging GPU acceleration for efficient computation, providing an optimized balance between semantic granularity and analytical efficiency for psychological text analysis.</p></sec></sec><sec id="s2-8"><title>Ethical Considerations</title><p>This study was conducted in accordance with strict ethical protocols. The data was sourced exclusively from the publicly available Internet Archive, containing no private information. There was no exclusive participation accounted for in this research; hence, no compensation was made. A rigorous deidentification process, including the removal of user IDs and the preprocessing of post content, was implemented to ensure user anonymity. All findings are reported in aggregate to prevent the identification of individuals. To further mitigate ethical risks, this study framed its analyses to emphasize population-level insights, carefully contextualizing the associations between personality traits and SU behaviors to prevent misinterpretation or misuse in real-world applications. These measures were implemented throughout the research process to ensure responsible handling of potentially sensitive behavioral data.</p><p>Beyond these procedural safeguards, it is important to reflect on the ethical implications of inferring sensitive traits such as age, gender, personality, and SU behaviors without explicit consent, even from public data. Our analyses were intentionally designed to avoid individual-level profiling, prioritize transparency in modeling methods, and interpret findings at the population level. By acknowledging these concerns, we aim to promote the responsible, ethically informed use of computational social science methods and digital phenotyping in public health research.</p><p>This research was supported by the Substance Abuse and Mental Health Services Administration Strategic Prevention Framework-19 (grant 6H79SP081502) and was approved by the Institutional Review Board at Kent State University (IRB20-182).</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Descriptive and Trend Analysis in Personality Traits</title><p>This section presents the findings on the relationship between 5 major personality traits and SU trends observed annually from 2019 to 2021. For the identified SU posts (2,799,726 in 2019, 3,502,171 in 2020, and 2,553,235 in 2021) from our previous work [<xref ref-type="bibr" rid="ref32">32</xref>], first, we predicted the score across each personality trait in a scale of 0 to 1 using our custom deep learning model [<xref ref-type="bibr" rid="ref38">38</xref>]. The data, including mean scores, SDs, and effect sizes for year-over-year changes, are summarized in <xref ref-type="table" rid="table1">Table 1</xref>. The analysis reveals distinct patterns for each personality trait, with notable shifts occurring particularly in the year 2020, a period marked by the onset of the global COVID-19 pandemic.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Personality traits and substance use trends (2019&#x2010;2021).</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Trait</td><td align="left" valign="bottom">2019, mean (SD)</td><td align="left" valign="bottom">2020, mean (SD)</td><td align="left" valign="bottom">2021, mean (SD)</td><td align="left" valign="bottom">Trend interpretation<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup></td></tr></thead><tbody><tr><td align="left" valign="top">Openness</td><td align="left" valign="top">0.47 (0.15)</td><td align="left" valign="top">0.49 (0.15)</td><td align="left" valign="top">0.47 (0.15)</td><td align="left" valign="top">&#x2191; in 2020 (<italic>d</italic>=0.13), then stabilized</td></tr><tr><td align="left" valign="top">Conscientiousness</td><td align="left" valign="top">0.69 (0.13)</td><td align="left" valign="top">0.71 (0.12)</td><td align="left" valign="top">0.70 (0.13)</td><td align="left" valign="top">&#x2191; in 2020 (<italic>d</italic>=0.15), slight &#x2193; in 2021</td></tr><tr><td align="left" valign="top">Agreeableness</td><td align="left" valign="top">0.38 (0.14)</td><td align="left" valign="top">0.39 (0.13)</td><td align="left" valign="top">0.39 (0.13)</td><td align="left" valign="top">Small &#x2191; in 2020 (<italic>d</italic>=0.07)</td></tr><tr><td align="left" valign="top">Neuroticism</td><td align="left" valign="top">0.63 (0.15)</td><td align="left" valign="top">0.61 (0.15)</td><td align="left" valign="top">0.61 (0.15)</td><td align="left" valign="top">&#x2193; in 2020 (<italic>d</italic>=&#x2212;0.13), contrary to expected pandemic stress effects</td></tr><tr><td align="left" valign="top">Extraversion</td><td align="left" valign="top">0.53 (0.14)</td><td align="left" valign="top">0.53 (0.14)</td><td align="left" valign="top">0.53 (0.14)</td><td align="left" valign="top">No change (<italic>P</italic>&#x2265;.99)</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>Cohen <italic>d</italic> values (0.07-0.15) indicate effect size for the change from the previous year.</p></fn></table-wrap-foot></table-wrap><p>An examination of the data presented reveals distinct patterns for each personality trait across the 3 years. For openness, the association with SU showed a fluctuation. It initially stood at mean 0.47 (SD 0.15) in 2019, then increased in 2020 to mean 0.497 (SD 0.15). This rise represented a small effect size (d=0.13). Subsequently, in 2021, the association returned to its 2019 level of mean 0.47 (SD 0.15), indicating a stabilization. The association between conscientiousness and SU also shifted during this period. Starting at mean 0.69 (SD 0.13) in 2019, it increased to mean 0.71 (SD 0.12) in 2020, a change reflecting a small effect size (d=0.15). In 2021, there was a slight decrease in this association to mean 0.70 (SD 0.13). Agreeableness demonstrated a minor change in its association with SU. The mean was 0.38 (SD 0.14) in 2019 and saw a small increase to mean 0.39 (SD 0.13) in 2020, with a negligible effect size (d=0.07). This slightly elevated association remained constant in 2021, with a mean of 0.39 (SD 0.13). A notable trend was observed for neuroticism. Its association with SU was a mean of 0.63 (SD 0.15) in 2019. Contrary to what might be expected under pandemic-related stress, this association slightly decreased to 0.61 (SD 0.15) in 2020, a change with a small negative effect size (d=&#x2212;0.13). The association then remained stable at this level in 2021. Finally, the association between extraversion and SU exhibited considerable stability. The mean association was 0.53 (SD 0.14) in 2019 and remained unchanged in both 2020, mean 0.53 (SD 0.14) and 2021, mean 0.53 (SD 0.14), with the analysis indicating no significant change (<italic>P&#x2265;</italic>.99). In summary, the results indicate that while the association of extraversion with SU remained constant, openness, conscientiousness, agreeableness, and neuroticism showed varying degrees of change in their associations with SU between 2019 and 2021, with the most pronounced shifts occurring in 2020.</p></sec><sec id="s3-2"><title>Personality Traits as Predictors of SU</title><p>To investigate the relationship between personality and SU, we first examined the distributional differences in the Big Five personality scores between the SU and nonsubstance user groups on a sample corpus of 133,374. As illustrated in <xref ref-type="fig" rid="figure2">Figure 2</xref>, a visual inspection of the data reveals distinct patterns. The distributions for extraversion and agreeableness are visibly shifted higher for the SU group, while the distribution for neuroticism is shifted lower. In contrast, the distributions for openness and conscientiousness appear largely similar between the 2 groups.</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Distribution of the Big Five personality trait scores for nonsubstance user and substance user groups.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v27i1e79454_fig02.png"/></fig><p>To formally test these observed differences and determine the unique contribution of each trait, we conducted a multiple logistic regression analysis on a balanced sample of 133,374 corpus (n=66,687 per group). The analysis used the dichotomous SU classification as the dependent variable, with the 5 continuous personality scores as independent variables. The overall model was statistically significant, indicating that personality traits reliably distinguished between the 2 groups. The OR and 95% CIs from the model are presented in <xref ref-type="fig" rid="figure3">Figure 3</xref>.</p><p>The analysis identified 3 statistically significant predictors. Agreeableness demonstrated a strong positive association with SU (OR 4.04, 95% CI 3.71-4.41, <italic>P</italic>&#x003C;.001). Extraversion also emerged as a robust positive predictor (OR 3.22, 95% CI 2.98-3.49, <italic>P</italic>&#x003C;.001). In contrast, a significant negative relationship was observed for neuroticism (OR 0.29, 95% CI 0.26-0.31, <italic>P</italic>&#x003C;.001).</p><p>Neither conscientiousness (OR 0.91, 95% CI 0.83-1.00, <italic>P</italic>=.055) nor openness (OR 0.97, 95% CI 0.89-1.05, <italic>P</italic>=.42) was found to be a statistically significant predictor in the final model, although the association for conscientiousness approached statistical significance.</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Log odds ratios of personality traits on substance use.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v27i1e79454_fig03.png"/></fig></sec><sec id="s3-3"><title>Emotion Association in Personality Traits</title><p>To explore the relationship between personality and emotional expression, a biserial correlation analysis was performed on a 2020 corpus of SU-related online posts. The analysis compared 5 personality traits against 7 emotion categories: namely, fear, joy, negative, positive, sadness, surprise, and trust, yielding generally weak to modest correlations, with absolute coefficient values ranging from 0.00 to 0.09, as detailed in <xref ref-type="fig" rid="figure4">Figure 4</xref>.</p><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>Heatmap correlation between personality traits and emotion markers. AGR: agreeableness; CON: conscientiousness; EXT: extraversion; NEU: neuroticism; OPN: openness.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v27i1e79454_fig04.png"/></fig><p>The findings indicated distinct emotional patterns for certain traits. Agreeableness showed the strongest positive association with positive emotionality, correlating most highly with joy (<italic>r</italic>=.09) and positive emotions (<italic>r</italic>=.06). In contrast, conscientiousness was linked to negative valence emotions, showing positive correlations with fear (<italic>r</italic>=.08) and sadness (<italic>r</italic>=.06). A counterintuitive pattern was observed for neuroticism, which was negatively correlated with the expression of negative emotions (<italic>r</italic>=&#x2212;.08), fear (<italic>r</italic>=&#x2212;.07), and sadness (<italic>r</italic>=&#x2212;.06). Correlations for extraversion and openness were weaker and less distinct across all emotion categories.</p></sec><sec id="s3-4"><title>Personality Traits as Predictors of Various Substance Types</title><p>Multilevel logistic regression analyses were conducted to investigate the association between 5 core personality traits (openness, conscientiousness, extraversion, agreeableness, and neuroticism) and the likelihood of using various types of substances in the 2020 corpus. The findings for each personality trait are detailed below, referencing the estimated log ORs (coefficients) and their 95% CIs.</p></sec><sec id="s3-5"><title>Openness</title><p>As shown in <xref ref-type="fig" rid="figure5">Figure 5</xref>, openness demonstrated several significant associations with SU. Higher levels of openness were significantly associated with an increased likelihood of using alcohol, with a coefficient of approximately 0.014, and cannabinoids, with a coefficient of approximately 0.010. A similar positive association was found with stimulants, yielding a coefficient of approximately 0.005. Furthermore, openness was significantly associated with an increased likelihood of tobacco use (coefficient&#x2248;0.0005), opioid use (coefficient&#x2248;0.001), dissociative drug use (coefficient&#x2248;0.001), the use of other compounds (coefficient&#x2248;0.001), and the use of prescription medications (coefficient&#x2248;0.0005). For all these latter substances, the effect sizes indicated a slightly increased likelihood. In contrast, nonsignificant associations were observed between openness and the use of club drugs and hallucinogens.</p><fig position="float" id="figure5"><label>Figure 5.</label><caption><p>Log odds ratios (and 95% CIs) for the association between openness and various substance types.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v27i1e79454_fig05.png"/></fig></sec><sec id="s3-6"><title>Conscientiousness</title><p><xref ref-type="fig" rid="figure6">Figure 6</xref> illustrates the relationship between conscientiousness and SU. Higher conscientiousness was significantly associated with a decreased likelihood of using alcohol, indicated by a coefficient of approximately &#x2212;0.011. Similarly, increased conscientiousness was linked to a reduced probability of using cannabinoids (coefficient&#x2248;&#x2212;0.008) and stimulants (coefficient&#x2248;&#x2212;0.003). Conversely, a somewhat counterintuitive finding was that higher conscientiousness was significantly associated with a slightly increased likelihood of using opioids (coefficient&#x2248;0.001) and other compounds (coefficient&#x2248;0.0005). There were no significant associations found between conscientiousness and the use of tobacco, club drugs, dissociative drugs, hallucinogens, or prescription medications.</p><fig position="float" id="figure6"><label>Figure 6.</label><caption><p>Log odds ratios (and 95% CIs) for the association between conscientiousness and various substance types.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v27i1e79454_fig06.png"/></fig></sec><sec id="s3-7"><title>Extraversion</title><p>Extraversion showed widespread significant positive associations with SU, as depicted in <xref ref-type="fig" rid="figure7">Figure 7</xref>. A higher degree of extraversion was significantly associated with an increased likelihood of using cannabinoids, which showed the largest effect size for this trait (coefficient&#x2248;0.031). Positive associations were also found for alcohol (coefficient&#x2248;0.017), stimulants (coefficient&#x2248;0.009), and tobacco (coefficient&#x2248;0.006). Additionally, higher extraversion was linked to an increased likelihood of using opioids (coefficient&#x2248;0.002), hallucinogens (coefficient&#x2248;0.002), other compounds (coefficient&#x2248;0.002), and prescription medications (coefficient&#x2248;0.001). Nonsignificant associations were observed between extraversion and the use of club drugs and dissociative drugs.</p><fig position="float" id="figure7"><label>Figure 7.</label><caption><p>Log odds ratios (and 95% CIs) for the association between extraversion and various substance types.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v27i1e79454_fig07.png"/></fig></sec><sec id="s3-8"><title>Agreeableness</title><p>The associations between agreeableness and SU are presented in <xref ref-type="fig" rid="figure8">Figure 8</xref>. Higher agreeableness was significantly associated with a decreased likelihood of using cannabinoids, with a coefficient of approximately &#x2212;0.012, and tobacco, with a coefficient of approximately &#x2212;0.008. Intriguingly, higher agreeableness was also significantly associated with an increased likelihood of using several substances. The most notable positive association was with alcohol (coefficient&#x2248;0.023). Furthermore, increased agreeableness was linked to a higher probability of using opioids (coefficient&#x2248;0.003), stimulants (coefficient&#x2248;0.002), club drugs (coefficient&#x2248;0.001), hallucinogens (coefficient&#x2248;0.001), and other compounds (coefficient&#x2248;0.001). No significant associations were found between agreeableness and the use of dissociative drugs or prescription medications.</p><fig position="float" id="figure8"><label>Figure 8.</label><caption><p>Log odds ratios (and 95% CIs) for the association between agreeableness and various substance types.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v27i1e79454_fig08.png"/></fig></sec><sec id="s3-9"><title>Neuroticism</title><p><xref ref-type="fig" rid="figure9">Figure 9</xref> displays the results for neuroticism. Higher neuroticism was significantly associated with an increased likelihood of using alcohol, with a coefficient of approximately 0.020. Positive associations, though smaller in magnitude, were also observed for hallucinogens (coefficient&#x2248;0.001) and other compounds (coefficient&#x2248;0.001). A very small but statistically significant positive association was also noted with prescription medications (coefficient near 0). Conversely, higher neuroticism was significantly associated with a decreased likelihood of using several other substances. The strongest negative association was with cannabinoids (coefficient&#x2248;&#x2212;0.030). Other significant negative associations were found for stimulants (coefficient&#x2248;&#x2212;0.007), tobacco (coefficient&#x2248;&#x2212;0.005), and opioids (coefficient&#x2248;&#x2212;0.004). Nonsignificant associations were found between neuroticism and the use of club drugs and dissociative drugs.</p><fig position="float" id="figure9"><label>Figure 9.</label><caption><p>Log odds ratios (and 95% CIs) for the association between neuroticism and various substance types.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v27i1e79454_fig09.png"/></fig></sec><sec id="s3-10"><title>Personality Traits Association With Age and Gender</title><p>This section details the findings from a multilevel logistic analysis examining the interaction between personality traits and demographic factors (age group and sex) in relation to SU. The results are presented as ORs with 95% CIs. An OR greater than 1.00 indicates that a personality trait&#x2019;s association with SU is stronger (or less protective) in the index group (teenagers or females) compared to the reference group (adults or males). Conversely, an OR less than 1.00 suggests the trait&#x2019;s association is weaker (or more protective) in the index group. All reported effects are statistically significant, as indicated by CIs not crossing 1.00, owing in part to the large sample sizes.</p><p>To better capture demographic-specific patterns and potential nonlinear effects of age and sex on personality-SU associations, we stratified the analyses by age group and gender rather than including these variables solely as covariates. This stratification enables a clearer depiction of how personality traits influence SU discourse within distinct subgroups, highlighting developmental and sex-specific variations that might be obscured in aggregate models.</p></sec><sec id="s3-11"><title>Personality Traits and SU: Teenagers Versus Adults</title><p><xref ref-type="fig" rid="figure10">Figure 10</xref> illustrates the differential association of personality traits with SU in teenagers (n=849,510) compared to adults (n=1,257,705). The association between openness and SU was found to be significantly stronger among teenagers than adults (OR 1.04, 95% CI 1.04-1.04). Similarly, extraversion&#x2019;s association with SU was slightly stronger in teenagers compared to adults (OR 1.01, 95% CI 1.01-1.01). In contrast, the association of agreeableness with SU, which is typically protective, was found to be slightly more pronounced (more protective) in teenagers relative to adults (OR 0.99, 95% CI 0.98-0.99). Conscientiousness, generally a protective trait, exhibited a significantly weaker protective association with SU in teenagers when compared to adults (OR 1.03, 95% CI 1.03-1.04), suggesting that the protective effect of conscientiousness against SU is attenuated in adolescence. Finally, the association of neuroticism with SU, typically a risk factor, was found to be slightly weaker in teenagers compared to adults (OR 0.98, 95% CI 0.98-0.98).</p><fig position="float" id="figure10"><label>Figure 10.</label><caption><p>Personality traits associated with teenagers&#x2019; substance use versus adults&#x2019; substance use. AGR: agreeableness; CON: conscientiousness; EXT: extraversion; NEU: neuroticism; OPN: openness.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v27i1e79454_fig10.png"/></fig></sec><sec id="s3-12"><title>Personality Traits and SU: Females Versus Males</title><p><xref ref-type="fig" rid="figure11">Figure 11</xref> presents the differential association of personality traits with SU in females (n=1,653,265) compared to males (n=1,558,727). The protective association of conscientiousness with SU was slightly stronger in females than in males (OR 0.99, 95% CI 0.99-1.00). Extraversion&#x2019;s association with SU was weaker among females compared to males (OR 0.98, 95% CI 0.98-0.99), and the association of openness with SU was also weaker in females relative to males (OR 0.96, 95% CI 0.95-0.96). Agreeableness demonstrated a substantially stronger protective association with SU in females compared to males (OR 0.92, 95% CI 0.91-0.92). Lastly, neuroticism&#x2019;s association as a risk factor for SU was weaker in females compared to males (OR 0.97, 95% CI 0.97-0.97).</p><fig position="float" id="figure11"><label>Figure 11.</label><caption><p>Personality traits associated with male substance use versus female substance use. AGR: agreeableness; CON: conscientiousness; EXT: extraversion; NEU: neuroticism; OPN: openness.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v27i1e79454_fig11.png"/></fig></sec><sec id="s3-13"><title>Topic Analysis</title><p>This section presents key themes or topics discussed within each personality trait in SU discourse. We conducted the BERTopic analysis to identify thematic clusters within a corpus of documents from 2020 related to personality traits and SU. The analysis was performed separately for documents associated with each of the Big Five personality traits. For each trait, the most prominent topics, their corresponding document counts, and their proportion relative to the total documents for that trait are reported in <xref ref-type="table" rid="table2">Table 2</xref>.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>BERTopic analysis result.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Topic</td><td align="left" valign="bottom">OpenAI label</td><td align="left" valign="bottom">Document, n (%)</td></tr></thead><tbody><tr><td align="left" valign="top">Openness</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>0</td><td align="left" valign="top">Openness to nightlife enjoyment</td><td align="left" valign="top">134,265 (54.42)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>1</td><td align="left" valign="top">Openness to addiction</td><td align="left" valign="top">92,386 (37.45)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>2</td><td align="left" valign="top">Political negligence</td><td align="left" valign="top">8246 (3.34)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>3</td><td align="left" valign="top">Public health opinions</td><td align="left" valign="top">3100 (1.26)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>4</td><td align="left" valign="top">Change in supply and distribution</td><td align="left" valign="top">2898 (1.17)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>5</td><td align="left" valign="top">Innovative service improvements</td><td align="left" valign="top">2626 (1.06)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>6</td><td align="left" valign="top">Political retrograde</td><td align="left" valign="top">1963 (0.8)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>7</td><td align="left" valign="top">Stress drinking</td><td align="left" valign="top">1077 (0.44)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>8</td><td align="left" valign="top">Embracing normalization</td><td align="left" valign="top">74 (0.3)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>9</td><td align="left" valign="top">Embracing fully</td><td align="left" valign="top">62 (0.3)</td></tr><tr><td align="left" valign="top">Conscientiousness</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>0</td><td align="left" valign="top">Responsible drinking habits</td><td align="left" valign="top">149,860 (52.78)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>1</td><td align="left" valign="top">Responsible smoking habits</td><td align="left" valign="top">124,349 (43.80)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>2</td><td align="left" valign="top">Political retrograde and study</td><td align="left" valign="top">3641 (1.28)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>3</td><td align="left" valign="top">Homeless advocacy efforts</td><td align="left" valign="top">1398 (0.49)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>4</td><td align="left" valign="top">Contract liquidation assessment</td><td align="left" valign="top">1316 (0.46)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>5</td><td align="left" valign="top">Consistent technology upgrades</td><td align="left" valign="top">1103 (0.39)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>6</td><td align="left" valign="top">Climate change impact analysis</td><td align="left" valign="top">969 (0.34)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>7</td><td align="left" valign="top">Maine senator Susan Collins</td><td align="left" valign="top">850 (0.3)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>8</td><td align="left" valign="top">Religious attributes</td><td align="left" valign="top">353 (0.12)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>9</td><td align="left" valign="top">Organized and responsible mindset</td><td align="left" valign="top">91 (0.03)</td></tr><tr><td align="left" valign="top">Extraversion</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>0</td><td align="left" valign="top">Social drinking behavior</td><td align="left" valign="top">150,361 (48.46)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>1</td><td align="left" valign="top">Social smoking habits</td><td align="left" valign="top">140,837 (45.40)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>2</td><td align="left" valign="top">Political events</td><td align="left" valign="top">13,560 (4.37)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>3</td><td align="left" valign="top">School discussion</td><td align="left" valign="top">2571 (0.83)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>4</td><td align="left" valign="top">Cancellation and bankruptcy</td><td align="left" valign="top">1143 (0.37)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>5</td><td align="left" valign="top">Normalize the change</td><td align="left" valign="top">1064 (0.34)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>6</td><td align="left" valign="top">Discussion about deaths</td><td align="left" valign="top">303 (0.1)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>7</td><td align="left" valign="top">Energetic socialization behavior</td><td align="left" valign="top">232 (0.07)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>8</td><td align="left" valign="top">Normalize social interaction</td><td align="left" valign="top">118 (0.04)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>9</td><td align="left" valign="top">Outgoing enthusiast</td><td align="left" valign="top">56 (0.02)</td></tr><tr><td align="left" valign="top">Agreeableness</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>0</td><td align="left" valign="top">Friendly beverage choices</td><td align="left" valign="top">136,175 (54.48)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>1</td><td align="left" valign="top">Social drinking habits</td><td align="left" valign="top">99,238 (39.70)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>2</td><td align="left" valign="top">Nobody protests peacefully, agitated</td><td align="left" valign="top">6852 (2.74)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>3</td><td align="left" valign="top">Changes in supply and distribution</td><td align="left" valign="top">2894 (1.16)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>4</td><td align="left" valign="top">Employee and contracts</td><td align="left" valign="top">2278 (0.91)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>5</td><td align="left" valign="top">School and eligible discussion</td><td align="left" valign="top">1191 (0.48)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>6</td><td align="left" valign="top">Normalize the change</td><td align="left" valign="top">558 (0.22)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>7</td><td align="left" valign="top">Weather demands</td><td align="left" valign="top">442 (0.18)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>8</td><td align="left" valign="top">Gentle pain relief</td><td align="left" valign="top">292 (0.12)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>9</td><td align="left" valign="top">Harmony discussion</td><td align="left" valign="top">53 (0.02)</td></tr><tr><td align="left" valign="top">Neuroticism</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>0</td><td align="left" valign="top">Emotionally turbulent drinking habits</td><td align="left" valign="top">123,209 (50.05)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>1</td><td align="left" valign="top">Drink and anxiety association</td><td align="left" valign="top">95,229 (38.69)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>2</td><td align="left" valign="top">Anxiety during the COVID pandemic</td><td align="left" valign="top">10,570 (4.29)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>3</td><td align="left" valign="top">Contract liquidation and upgrade</td><td align="left" valign="top">8186 (3.33)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>4</td><td align="left" valign="top">Political tension</td><td align="left" valign="top">7036 (2.86)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>5</td><td align="left" valign="top">Anxious hopes</td><td align="left" valign="top">854 (0.35)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>6</td><td align="left" valign="top">Normalize the change</td><td align="left" valign="top">565 (0.23)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>7</td><td align="left" valign="top">Medications</td><td align="left" valign="top">227 (0.09)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>8</td><td align="left" valign="top">Liquid and drinks</td><td align="left" valign="top">174 (0.07)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>9</td><td align="left" valign="top">Cross-border issues</td><td align="left" valign="top">105 (0.04)</td></tr></tbody></table></table-wrap><p>A total of 246,700 documents were analyzed in relation to openness. The 2 most dominant topics identified were &#x201C;openness to nightlife enjoyment&#x201D; (topic 0) accounting for 54.42% (n=134,265) of the documents, and &#x201C;openness to addiction&#x201D; (topic 1) comprising 37.45% (n=92,386). A smaller, yet notable topic, &#x201C;stress drinking&#x201D; (topic 7), appeared in 0.44% (n=1077) of documents. Other topics, such as &#x201C;political negligence&#x201D; (n=8246, 3.34%), &#x201C;public health opinions&#x201D; (n=3100, 1.26%), and &#x201C;change in supply and distributions&#x201D; (n=2898, 1.17%), represented smaller proportions and appeared less directly related to SU behaviors per se, potentially reflecting broader contextual discussions within the dataset.</p><p>For conscientiousness, 283,930 documents were analyzed. The analysis revealed 2 primary topics: &#x201C;responsible drinking habits&#x201D; (topic 0) which constituted 52.78% (n=149,860) of the documents, and &#x201C;responsible smoking habits&#x201D; (topic 1) accounting for 43.80% (n=124,349) of them. A very small proportion was attributed to &#x201C;organized and responsible mindset&#x201D; (topic 9) at 0.03% (n=91). The remaining topics, such as &#x201C;political retrograde and study&#x201D; (n=3641, 1.28%) and &#x201C;homeless advocacy efforts&#x201D; (n=1398, 0.49%) were less prevalent and less clearly connected to individual SU patterns.</p><p>The analysis of 310,245 documents related to extraversion highlighted &#x201C;social drinking behavior&#x201D; (topic 0) as the most significant topic, with 48.46% (n=150,361) of the documents. Closely following was &#x201C;social smoking habits&#x201D; (topic 1) representing 45.40% (n=140,837). Smaller topics included &#x201C;energetic socialization behavior&#x201D; (topic 7) at 0.07% (n=232) and &#x201C;outgoing enthusiast&#x201D; (topic 9) at 0.02% (n=56). Topics such as &#x201C;political events&#x201D; (n=13,560, 4.37%) and &#x201C;school discussion&#x201D; (n=2571, 0.83%) were also present but had a less direct bearing on SU itself.</p><p>A total of 249,973 documents were analyzed for agreeableness. The most prominent topic was &#x201C;friendly beverage choices&#x201D; (topic 0) accounting for 54.48% (n=136,175) of documents. The second major topic was &#x201C;social drinking habits&#x201D; (topic 1) comprising 39.70% (n=99,238). A topic labeled &#x201C;gentle pain reliefs&#x201D; (topic 8) was found in 0.12% (n=292) of documents. Other identified topics, such as &#x201C;nobody protests peacefully, agitated&#x201D; (n=6852, 2.74%) and &#x201C;changes in supply and distributions&#x201D; (n=2894, 1.16%) were less frequent, and their connection to agreeableness in the context of SU was not immediately apparent from the labels.</p><p>For neuroticism, 246,155 documents were processed. The leading topic was &#x201C;emotionally turbulent drinking habits&#x201D; (topic 0) representing 50.05% (n=123,209) of the documents. The second significant topic was &#x201C;drink and anxiety association&#x201D; (topic 1) with 38.69% (n=95,229). Another relevant topic, &#x201C;anxiety during COVID pandemic&#x201D; (topic 2) accounted for 4.29% (n=10,570). The topic &#x201C;medications&#x201D; (topic 7) appeared in 0.09% (n=227) of documents.</p></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>The principal finding of this research underscores the paramount importance of social-relational personality traits in predicting SU within the studied online communities.</p><p>Our analysis identifies extraversion (OR 3.22, 95% CI 2.98-3.49) and, most powerfully, agreeableness (OR 4.04, 95% CI 3.71-4.41) as the strongest positive predictors of SU. This suggests that, within this digital sphere, SU discourse is deeply embedded in social and affiliative contexts, a conclusion reinforced by topic analyses revealing prominent themes of &#x201C;social drinking behavior&#x201D; and &#x201C;friendly beverage choices.&#x201D;</p><p>In stark contrast to this socially driven pattern, and challenging long-held theoretical assumptions, our study reveals a paradoxical and robust protective effect of neuroticism. This counterintuitive finding is consistently supported across our analyses: neuroticism was strongly and negatively associated with SU classification (OR 0.29, 95% CI 0.26-0.31), its link to SU discussions diminished during the 2020 pandemic peak (d=&#x2212;0.13), and it was negatively correlated with the online expression of negative emotions (r=&#x2212;.08). This result directly opposes the traditional self-medication hypothesis, which posits that individuals use substances to cope with negative affect [<xref ref-type="bibr" rid="ref43">43</xref>]. A potential explanation lies in online expression; individuals high in neuroticism may be less inclined to participate in public substance-related discussions due to concerns over social judgment or reputational risk, even if they engage in SU offline. Moreover, negative emotions might be managed through private coping mechanisms rather than overt online disclosure, while SU-related conversations appear to attract users with social-affiliative traits, such as extraversion and agreeableness. Together, these patterns indicate that online SU discourse reflects the social and performative functions of communication, highlighting a distinction between public engagement and direct behavioral risk, and providing a nuanced understanding of personality influences in digital contexts.</p><p>Collectively, these findings suggest that in contemporary online environments, the drivers of SU discourse may pivot away from solitary emotional coping and toward functions of social connection. While the pandemic provided a salient natural context that accentuated these tendencies, it is equally plausible that these patterns reflect broader digital-era dynamics of social affiliation and positive self-expression, consistent with emerging perspectives in online health behavior [<xref ref-type="bibr" rid="ref29">29</xref>] and positive psychology.</p></sec><sec id="s4-2"><title>RQ1: Longitudinal Variation: Did the Linguistic Expression of Big Five Personality Traits in SU-Related Discourse on Twitter Exhibit Significant Longitudinal Variation Between 2019-2021, and What Was the Measurable Impact of the COVID-19 Pandemic on These Temporal Patterns?</title><p>Our longitudinal analysis confirms the COVID-19 pandemic acted as a significant catalyst, altering the linguistic expression of personality within SU discourse on Twitter. The year 2020 saw an increase in language related to openness, likely reflecting an exploration of novel coping mechanisms during a period of uncertainty [<xref ref-type="bibr" rid="ref44">44</xref>], and conscientiousness. The latter&#x2019;s increase does not suggest more SU, but rather a heightened discourse around regulation and control as conscientious individuals grappled with disrupted routines and health anxieties [<xref ref-type="bibr" rid="ref45">45</xref>].</p><p>Most critically, the linguistic markers for neuroticism significantly decreased, directly challenging the self-medication hypothesis [<xref ref-type="bibr" rid="ref43">43</xref>], which would predict a surge. This counterintuitive finding may be explained by &#x201C;affective blunting,&#x201D; where substances effectively numb distress and thus reduce its linguistic expression, or by a &#x201C;discourse displacement,&#x201D; where universal pandemic anxiety became a less specific theme to tie to SU. Meanwhile, the stability of extraversion underscores that the core function of SU discourse as a medium for social connection remained robust despite physical distancing. These findings illustrate that the pandemic did not simply amplify existing trends but fundamentally reshaped the content of online SU conversations.</p></sec><sec id="s4-3"><title>RQ2: Predictive Analysis: To What Extent Do the Big Five Personality Traits Predict SU Classification Among Individuals on Platform Twitter During the Unique Socioenvironmental Context of the COVID-19 Pandemic?</title><p>Our predictive analysis reveals a personality profile of online SU discourse that fundamentally prioritizes social-relational functions over individual distress, presenting a direct challenge to established risk models. The 2 strongest predictors for being classified as an SU were agreeableness (OR 4.04, 95% CI 3.71-4.41) and extraversion (OR 3.22, 95% CI 2.98-3.49). While the link to extraversion aligns with theories of sensation-seeking and sociability [<xref ref-type="bibr" rid="ref46">46</xref>], the powerful, positive association with agreeableness is highly novel. It starkly contrasts with a large body of literature that typically links low agreeableness to SUDs [<xref ref-type="bibr" rid="ref6">6</xref>]. This suggests that on a public platform such as Twitter, SU discourse is not an act of antagonism or noncompliance but rather a prosocial behavior, where agreeable individuals engage in communal sharing and social bonding around the topic.</p><p>Perhaps most consequentially, neuroticism emerged as a robust protective factor (OR 0.29, 95% CI 0.26-0.31). This finding directly contradicts the canonical self-medication hypothesis, which posits that individuals high in neuroticism are more likely to use substances to cope with negative affects [<xref ref-type="bibr" rid="ref43">43</xref>]. Our results indicate that on this platform, individuals exhibiting higher neuroticism are significantly less likely to be part of the SU discourse community. This does not necessarily mean they abstain from SU, but rather that their potential distress does not translate into public, online identification with such behaviors. They may use other coping mechanisms or simply separate their internal emotional state from this specific form of social performance.</p><p>The nonsignificance of openness and conscientiousness in this predictive model suggests their primary role is not in determining if one joins the SU conversation, but rather in shaping the content and framing of that conversation once engaged. Ultimately, our findings make a critical distinction: personality on platform Twitter appears to predict engagement in the socially mediated discourse of SU, a behavior that is functionally distinct from the private act of consumption itself.</p></sec><sec id="s4-4"><title>RQ3: Emotional Expression: How Did the Emotional Tone of SU-Related Discourse Vary Across Individuals With Different Dominant Personality Traits Throughout the Pandemic?</title><p>Examining emotional expression during the 2020 pandemic peak reveals how personality shapes the affective tone of SU discourse. The link between conscientiousness and emotions of fear and sadness points to a form of &#x201C;responsible anxiety,&#x201D; where discourse was imbued with legitimate concerns about health and control amidst a crisis [<xref ref-type="bibr" rid="ref45">45</xref>]. In contrast, the association of agreeableness with joy and positivity highlights its role as a &#x201C;social glue,&#x201D; with individuals likely framing SU in a positive, communal light to foster support and morale during a period of isolation.</p><p>The most telling result is the negative correlation between neuroticism and the expression of negative emotions. This provides strong support for an &#x201C;affective blunting&#x201D; or suppression hypothesis, suggesting that for these individuals, SU discourse reflects a state where negative feelings have been dampened, rather than a platform for cathartic expression. This challenges us to consider that for some, SU discussions may signify emotional regulation and suppression, not just the articulation of distress.</p></sec><sec id="s4-5"><title>RQ4: Substance Specificity: What Were the Associations Between Inferred Personality Traits and Discourse Related to Specific Substance Types?</title><p>Disaggregating SU by substance type reveals critical, personality-driven patterns. The association between neuroticism and alcohol discourse supports a specified self-medication model, where individuals turned to a legal and accessible anxiolytic to cope with pandemic-induced distress [<xref ref-type="bibr" rid="ref47">47</xref>]. This finding provides a personality-based lens on the widely reported increase in alcohol consumption during lockdowns.</p><p>Conversely, openness to experience was linked to discussions of cannabinoids and hallucinogens, consistent with the trait&#x2019;s connection to novelty-seeking [<xref ref-type="bibr" rid="ref5">5</xref>]. This discourse likely reflects a form of &#x201C;cognitive escapism&#x201D; from the monotony of confinement. Finally, extraversion remained tied to socially contextualized substances such as alcohol and cannabis, with discourse focused on adapting social rituals to a virtual environment. These findings confirm that motivations for use are codetermined by personality and substance, necessitating targeted, rather than generic, public health messaging.</p></sec><sec id="s4-6"><title>RQ5: Demographic Dimensions: How Did the Relationships Between Personality and SU Discourse Differ Across Key Demographic Factors, Specifically Age and Gender?</title><p>Our findings confirm that age and sex are crucial moderators of personality&#x2019;s influence on SU discourse. In adolescence, the observed patterns, such as a diminished protective effect of conscientiousness and amplified influence of extraversion, align with developmental neuroscience models of a maturing prefrontal cortex and a hypersensitive social reward system. This highlights a unique developmental window of personality-based risk and resilience.</p><p>Furthermore, we identified significant sex differences. The stronger protective effects of agreeableness and conscientiousness in females align with established gender differences in personality and risk-aversion [<xref ref-type="bibr" rid="ref24">24</xref>]. Critically, risk-associated traits such as neuroticism and extraversion had weaker associations with SU discourse in females, suggesting different, possibly more internalizing or relational, pathways to SU. These results underscore the necessity of moving beyond monolithic models of risk to develop intersectional, demographic-specific prevention strategies.</p></sec><sec id="s4-7"><title>RQ6: Thematic Content: What Were the Prevailing Topics Within SU Discourse, and How Did These Themes Differ Across the Five Major Personality Traits During the Pandemic?</title><sec id="s4-7-1"><title>Overview</title><p>The topic analysis revealed distinct &#x201C;narrative frameworks&#x201D; for SU that are patterned by personality, providing a clear basis for tailored public health interventions. The discourse of neuroticism centered on &#x201C;emotional coping,&#x201D; suggesting that messaging for this group should focus on alternative emotional regulation strategies [<xref ref-type="bibr" rid="ref48">48</xref>]. In contrast, the extraversion and agreeableness narratives focused on &#x201C;social facilitation,&#x201D; indicating a need for interventions that target harm reduction in social settings and promote nonsubstance-based social activities.</p><p>The dual themes of &#x201C;sensation-seeking&#x201D; and &#x201C;addiction awareness&#x201D; for openness highlight a user base receptive to sophisticated, fact-based harm reduction information. Finally, the conscientiousness discourse on &#x201C;controlled behavior&#x201D; suggests this group would be responsive to tools for self-monitoring and goal-setting. By identifying these personality-specific discursive fingerprints, we can move beyond one-size-fits-all campaigns to develop more resonant and effective public health communications in the digital age.</p></sec><sec id="s4-7-2"><title>Theoretical and Practical Implications</title><p>The implications of this social-centric model are significant for both theory and practice. Our findings demand that researchers distinguish between the private act of substance consumption and the mention of the usage of substances in online discourse. This provides a direct blueprint for personality-tailored public health interventions: focusing on harm reduction in social settings for individuals high in agreeableness and extraversion, while offering alternative coping strategies for the &#x201C;emotional coping&#x201D; narratives associated with neuroticism [<xref ref-type="bibr" rid="ref48">48</xref>]. Acknowledging the present study&#x2019;s limitations, future work should validate these findings across different platforms and integrate them with offline clinical data to build a more holistic and effective framework for addressing SU risk in the digital age.</p></sec><sec id="s4-7-3"><title>Policy Implications</title><p>From a policy perspective, these results underscore the importance of targeting the social drivers of SU discourse online. Prevention strategies should go beyond individual-level risk and address the communal contexts where SU is normalized, particularly among highly agreeable and extraverted users. The protective effect of neuroticism highlights the need for adaptive, data-driven monitoring that can refine early-warning systems during public health crises. Policy makers could leverage NLP-based tools for real-time trend detection while partnering with technology companies to embed harm-reduction interventions, such as in-platform nudges or targeted public service announcements. To ensure equity, these strategies must be accompanied by safeguards that protect user privacy, mitigate stigmatization, and promote algorithmic transparency. By aligning digital health policies with personality-informed insights, governments and health agencies can better anticipate, monitor, and reduce SU-related harms in the digital era.</p></sec></sec><sec id="s4-8"><title>Limitations</title><p>The findings of this study, while offering valuable insights into the dynamics of SU discourse on social media, must be interpreted in light of several important limitations.</p><p>A primary constraint stems from our reliance on probabilistic inference models to ascertain user attributes. Although our classifiers achieved approximately 80% accuracy, inferred data are proxies, not ground-truth information, and the potential for misclassification can introduce bias that propagates through the analysis. This is compounded by our use of an archival dataset from Twitter [<xref ref-type="bibr" rid="ref31">31</xref>], where data inconsistencies could impact the precision of longitudinal analyses. Furthermore, this study&#x2019;s scope is confined to English-language discourse on Twitter, which limits the generalizability of our findings to other platforms, cultures, or languages where SU expression differs.</p><p>An important conceptual limitation concerns the treatment of engagement in SU discourse as a proxy for actual SU behavior. Users may participate in substance-related discussions for social, performative, or cultural reasons without personally consuming substances. Consequently, the presence of SU-related posts should not be interpreted as definitive evidence of individual SU. While this proxy enables large-scale, population-level analyses, it constrains the ability to draw causal inferences about personal behavior and necessitates caution in interpreting associations between personality traits and SU engagement online.</p><p>Another limitation lies in the application of a personality model trained on Reddit data to Twitter users. While prior research has shown that language-based personality inference models can generalize reasonably well across platforms [<xref ref-type="bibr" rid="ref49">49</xref>], differences in user demographics, community norms, and writing styles between Reddit and Twitter may introduce systematic biases. For example, Reddit&#x2019;s longer-form discussions differ from the brevity and immediacy of tweets, which could influence the linguistic markers of personality traits. Thus, while the use of a well-validated model enables scalable personality assessment, its cross-platform application must be interpreted cautiously.</p><p>Finally, our demographic analysis is constrained by the nonrepresentative user base of Twitter, which is known to skew toward the younger and more urban. In addition, demographic inference models themselves may introduce biases. For example, gender classifiers are limited in recognizing nonbinary or gender-diverse individuals, and other attributes such as race or age may be misclassified due to sparse or ambiguous linguistic signals. Without reliable platform-wide demographic benchmarks, it is impossible to fully normalize our findings, meaning observed differences between groups could reflect both representation disparities and limitations of demographic inference rather than true behavioral patterns.</p><p>Additionally, while this study spans 2019&#x2010;2021, our focus is on understanding personality-SU relationships in online discourse, treating the pandemic as a contextual societal shock. Descriptive data from 2019 and 2021 provide a reference point, but this study does not perform formal comparisons between crisis and normal conditions; such analyses are considered a direction for future research.</p></sec><sec id="s4-9"><title>Future Work</title><p>Building on the findings and limitations of this study, several key avenues for future research emerge. These directions focus on enhancing methodological rigor, expanding the scope of analysis for greater generalizability, and integrating diverse data sources for a more holistic understanding.</p><p>First, future work should prioritize the refinement and validation of the computational models used for inference. A critical next step is to conduct rigorous domain adaptation testing to evaluate and improve the performance of models trained on one platform (Reddit) and applied to another (Twitter), as was the case for our personality classifier. This would help account for platform-specific linguistic norms and reduce potential bias. Similarly, developing more transparent and inclusive demographic inference models, trained on more diverse and representative datasets, is essential for improving the accuracy and equity of these computational tools.</p><p>Second, the scope of the research should be significantly broadened to enhance the generalizability of the findings. This involves expanding the analysis to include multiple social media platforms (such as Reddit, 2024 [<xref ref-type="bibr" rid="ref50">50</xref>], TikTok, 2024 [ByteDance] [<xref ref-type="bibr" rid="ref51">51</xref>], and Facebook, 2024 [Meta] [<xref ref-type="bibr" rid="ref52">52</xref>]) to capture a more complete picture of the digital ecosystem. Concurrently, future studies must move beyond an English-language focus by leveraging multilingual NLP models. Such an endeavor would not only provide a more global perspective on SU discourse but would also necessitate interdisciplinary collaborations with social scientists, ethicists, and researchers fluent in other languages to ensure the culturally competent application of these methods.</p><p>Finally, to overcome the inherent limitations of using social media data alone, future research should aim to triangulate computational findings with traditional offline data sources. Integrating large-scale social media analyses with clinical records, ecological momentary assessments, or targeted surveys would allow researchers to validate digital proxies against ground-truth behaviors and clinical outcomes. This mixed-methods approach would provide a much richer, multilayered understanding of the complex interplay between personality, SU, and mental health, ultimately strengthening the foundation for developing more effective and responsive public health interventions.</p></sec><sec id="s4-10"><title>Conclusions</title><p>This research fundamentally reconfigures the understanding of SU in digital spaces, revealing that online discourse is driven more by social connection than by individual distress, also supported by contemporary human behaviors research work [<xref ref-type="bibr" rid="ref29">29</xref>]. Our most significant finding is the robustly protective role of neuroticism (OR 0.29, 95% CI 0.26-0.31) against engaging in SU communities, a direct challenge to the canonical self-medication hypothesis [<xref ref-type="bibr" rid="ref43">43</xref>]. Instead of reflecting private turmoil, participation in these online discussions was most strongly predicted by the prosocial traits of agreeableness (OR 4.04, 95% CI 3.71-4.41) and extraversion (OR 3.22, 95% CI 2.98-3.49). These results suggest that on public platforms such as Twitter, especially during a crisis such as the COVID-19 pandemic, SU-related conversation often functions as a form of social bonding and affiliation rather than as a direct expression of negative affect.</p><p>Overall, this study provides a foundational basis for policy makers and public health practitioners to better understand these dynamics and to design informed, socially aware strategies for addressing SU in online spaces.</p></sec></sec></body><back><ack><p>This work is funded by the Substance Abuse and Mental Health Services Administration Strategic Prevention Framework-19 (grant 6H79SP081502). We also sincerely thank the editors and reviewers for their valuable feedback, which greatly improved the manuscript.</p></ack><notes><sec><title>Data Availability</title><p>The data and code supporting this study are publicly available on GitHub [<xref ref-type="bibr" rid="ref42">42</xref>].</p></sec></notes><fn-group><fn fn-type="con"><p>JM contributed to the conceptualization, methodology, investigation, formal analysis, model development, and writing of the original draft. RJ assisted in conceptualization and supervised this study. All authors reviewed and approved the final paper.</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">HDBSCAN</term><def><p>Hierarchical Density-Based Spatial Clustering of Applications With Noise</p></def></def-item><def-item><term id="abb2">NLP</term><def><p>natural language processing</p></def></def-item><def-item><term id="abb3">OR</term><def><p>odds ratio</p></def></def-item><def-item><term id="abb4">RQ</term><def><p>research question</p></def></def-item><def-item><term id="abb5">STROBE</term><def><p>Strengthening the Reporting of Observational Studies in Epidemiology</p></def></def-item><def-item><term id="abb6">SU</term><def><p>substance use</p></def></def-item><def-item><term id="abb7">SUD</term><def><p>substance use disorder</p></def></def-item><def-item><term id="abb8">UMAP</term><def><p>Uniform Manifold Approximation and Projection</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>McCrae</surname><given-names>RR</given-names> </name><name name-style="western"><surname>Costa Jr</surname><given-names>PT</given-names> </name><name name-style="western"><surname>John</surname><given-names>OP</given-names> </name><name name-style="western"><surname>Robins</surname><given-names>RW</given-names> </name><name name-style="western"><surname>Pervin</surname><given-names>LA</given-names> </name></person-group><article-title>The five-factor theory of personality</article-title><source>Handbook of Personality: Theory and Research</source><edition>3</edition><publisher-name>The Guilford Press</publisher-name><fpage>159</fpage><lpage>181</lpage></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Terracciano</surname><given-names>A</given-names> </name><name name-style="western"><surname>L&#x00F6;ckenhoff</surname><given-names>CE</given-names> </name><name name-style="western"><surname>Crum</surname><given-names>RM</given-names> </name><name name-style="western"><surname>Bienvenu</surname><given-names>OJ</given-names> </name><name name-style="western"><surname>Costa</surname><given-names>PT</given-names>  <suffix>Jr</suffix></name></person-group><article-title>Five-factor model personality profiles of drug users</article-title><source>BMC Psychiatry</source><year>2008</year><month>04</month><day>11</day><volume>8</volume><fpage>22</fpage><pub-id pub-id-type="doi">10.1186/1471-244X-8-22</pub-id><pub-id pub-id-type="medline">18405382</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kotov</surname><given-names>R</given-names> </name><name name-style="western"><surname>Gamez</surname><given-names>W</given-names> </name><name name-style="western"><surname>Schmidt</surname><given-names>F</given-names> </name><name name-style="western"><surname>Watson</surname><given-names>D</given-names> </name></person-group><article-title>Linking &#x201C;big&#x201D; personality traits to anxiety, depressive, and substance use disorders: a meta-analysis</article-title><source>Psychol Bull</source><year>2010</year><month>09</month><volume>136</volume><issue>5</issue><fpage>768</fpage><lpage>821</lpage><pub-id pub-id-type="doi">10.1037/a0020327</pub-id><pub-id pub-id-type="medline">20804236</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Akbari</surname><given-names>M</given-names> </name><name name-style="western"><surname>Lankarani</surname><given-names>KB</given-names> </name><name name-style="western"><surname>Heydari</surname><given-names>ST</given-names> </name><name name-style="western"><surname>Motevalian</surname><given-names>SA</given-names> </name><name name-style="western"><surname>Tabrizi</surname><given-names>R</given-names> </name><name name-style="western"><surname>Asadi-Shekari</surname><given-names>Z</given-names> </name></person-group><article-title>Meta-analysis of the correlation between personality characteristics and risky driving behaviors</article-title><source>J Inj Violence Res</source><year>2019</year><volume>11</volume><issue>2</issue><fpage>107</fpage><lpage>122</lpage><pub-id pub-id-type="doi">10.5249/jivr.v11i2.1172</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dash</surname><given-names>GF</given-names> </name><name name-style="western"><surname>Martin</surname><given-names>NG</given-names> </name><name name-style="western"><surname>Slutske</surname><given-names>WS</given-names> </name></person-group><article-title>Big Five personality traits and illicit drug use: specificity in trait-drug associations</article-title><source>Psychol Addict Behav</source><year>2023</year><month>03</month><volume>37</volume><issue>2</issue><fpage>318</fpage><lpage>330</lpage><pub-id pub-id-type="doi">10.1037/adb0000793</pub-id><pub-id pub-id-type="medline">34766786</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Turiano</surname><given-names>NA</given-names> </name><name name-style="western"><surname>Whiteman</surname><given-names>SD</given-names> </name><name name-style="western"><surname>Hampson</surname><given-names>SE</given-names> </name><name name-style="western"><surname>Roberts</surname><given-names>BW</given-names> </name><name name-style="western"><surname>Mroczek</surname><given-names>DK</given-names> </name></person-group><article-title>Personality and substance use in midlife: conscientiousness as a moderator and the effects of trait change</article-title><source>J Res Pers</source><year>2012</year><month>06</month><day>1</day><volume>46</volume><issue>3</issue><fpage>295</fpage><lpage>305</lpage><pub-id pub-id-type="doi">10.1016/j.jrp.2012.02.009</pub-id><pub-id pub-id-type="medline">22773867</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Malouff</surname><given-names>JM</given-names> </name><name name-style="western"><surname>Thorsteinsson</surname><given-names>EB</given-names> </name><name name-style="western"><surname>Rooke</surname><given-names>SE</given-names> </name><name name-style="western"><surname>Schutte</surname><given-names>NS</given-names> </name></person-group><article-title>Alcohol involvement and the five-factor model of personality: a meta-analysis</article-title><source>J Drug Educ</source><year>2007</year><volume>37</volume><issue>3</issue><fpage>277</fpage><lpage>294</lpage><pub-id pub-id-type="doi">10.2190/DE.37.3.d</pub-id><pub-id pub-id-type="medline">18047183</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Marengo</surname><given-names>D</given-names> </name><name name-style="western"><surname>Poletti</surname><given-names>I</given-names> </name><name name-style="western"><surname>Settanni</surname><given-names>M</given-names> </name></person-group><article-title>The interplay between neuroticism, extraversion, and social media addiction in young adult Facebook users: testing the mediating role of online activity using objective data</article-title><source>Addict Behav</source><year>2020</year><month>03</month><volume>102</volume><issue>306-4603</issue><fpage>106150</fpage><pub-id pub-id-type="doi">10.1016/j.addbeh.2019.106150</pub-id><pub-id pub-id-type="medline">31706139</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dash</surname><given-names>GF</given-names> </name><name name-style="western"><surname>Slutske</surname><given-names>WS</given-names> </name><name name-style="western"><surname>Martin</surname><given-names>NG</given-names> </name><name name-style="western"><surname>Statham</surname><given-names>DJ</given-names> </name><name name-style="western"><surname>Agrawal</surname><given-names>A</given-names> </name><name name-style="western"><surname>Lynskey</surname><given-names>MT</given-names> </name></person-group><article-title>Big Five personality traits and alcohol, nicotine, cannabis, and gambling disorder comorbidity</article-title><source>Psychol Addict Behav</source><year>2019</year><month>06</month><volume>33</volume><issue>4</issue><fpage>420</fpage><lpage>429</lpage><pub-id pub-id-type="doi">10.1037/adb0000468</pub-id><pub-id pub-id-type="medline">31094546</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Maharjan</surname><given-names>J</given-names> </name><name name-style="western"><surname>Zhu</surname><given-names>J</given-names> </name><name name-style="western"><surname>King</surname><given-names>J</given-names> </name><name name-style="western"><surname>Phan</surname><given-names>N</given-names> </name><name name-style="western"><surname>Kenne</surname><given-names>D</given-names> </name><name name-style="western"><surname>Jin</surname><given-names>R</given-names> </name></person-group><article-title>Large-scale deep learning-enabled infodemiological analysis of substance use patterns on social media: insights from the COVID-19 pandemic</article-title><source>JMIR Infodemiology</source><year>2025</year><month>04</month><day>17</day><volume>5</volume><fpage>e59076</fpage><pub-id pub-id-type="doi">10.2196/59076</pub-id><pub-id pub-id-type="medline">40244656</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="web"><article-title>The Twitter stream grab</article-title><source>Internet Archive</source><year>2021</year><access-date>2025-11-11</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://archive.org/details/twitterstream">https://archive.org/details/twitterstream</ext-link></comment></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Park</surname><given-names>G</given-names> </name><name name-style="western"><surname>Schwartz</surname><given-names>HA</given-names> </name><name name-style="western"><surname>Eichstaedt</surname><given-names>JC</given-names> </name><etal/></person-group><article-title>Automatic personality assessment through social media language</article-title><source>J Pers Soc Psychol</source><year>2015</year><month>06</month><volume>108</volume><issue>6</issue><fpage>934</fpage><lpage>952</lpage><pub-id pub-id-type="doi">10.1037/pspp0000020</pub-id><pub-id pub-id-type="medline">25365036</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Aschwanden</surname><given-names>D</given-names> </name><name name-style="western"><surname>Strickhouser</surname><given-names>JE</given-names> </name><name name-style="western"><surname>Sesker</surname><given-names>AA</given-names> </name><etal/></person-group><article-title>Psychological and behavioural responses to coronavirus disease 2019: the role of personality</article-title><source>Eur J Pers</source><year>2021</year><month>01</month><volume>35</volume><issue>1</issue><fpage>51</fpage><lpage>66</lpage><pub-id pub-id-type="doi">10.1002/per.2281</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pollard</surname><given-names>MS</given-names> </name><name name-style="western"><surname>Tucker</surname><given-names>JS</given-names> </name><name name-style="western"><surname>Green</surname><given-names>HD</given-names>  <suffix>Jr</suffix></name></person-group><article-title>Changes in adult alcohol use and consequences during the COVID-19 pandemic in the US</article-title><source>JAMA Netw Open</source><year>2020</year><month>09</month><day>1</day><volume>3</volume><issue>9</issue><fpage>e2022942</fpage><pub-id pub-id-type="doi">10.1001/jamanetworkopen.2020.22942</pub-id><pub-id pub-id-type="medline">32990735</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kuntsche</surname><given-names>E</given-names> </name><name name-style="western"><surname>Knibbe</surname><given-names>R</given-names> </name><name name-style="western"><surname>Gmel</surname><given-names>G</given-names> </name><name name-style="western"><surname>Engels</surname><given-names>R</given-names> </name></person-group><article-title>Who drinks and why? A review of socio-demographic, personality, and contextual issues behind the drinking motives in young people</article-title><source>Addict Behav</source><year>2006</year><month>10</month><volume>31</volume><issue>10</issue><fpage>1844</fpage><lpage>1857</lpage><pub-id pub-id-type="doi">10.1016/j.addbeh.2005.12.028</pub-id><pub-id pub-id-type="medline">16460883</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Khantzian</surname><given-names>EJ</given-names> </name></person-group><article-title>The self-medication hypothesis of substance use disorders: a reconsideration and recent applications</article-title><source>Harv Rev Psychiatry</source><year>1997</year><volume>4</volume><issue>5</issue><fpage>231</fpage><lpage>244</lpage><pub-id pub-id-type="doi">10.3109/10673229709030550</pub-id><pub-id pub-id-type="medline">9385000</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>de Wit</surname><given-names>H</given-names> </name></person-group><article-title>Impulsivity as a determinant and consequence of drug use: a review of underlying processes</article-title><source>Addict Biol</source><year>2009</year><month>01</month><volume>14</volume><issue>1</issue><fpage>22</fpage><lpage>31</lpage><pub-id pub-id-type="doi">10.1111/j.1369-1600.2008.00129.x</pub-id><pub-id pub-id-type="medline">18855805</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Getzmann</surname><given-names>S</given-names> </name><name name-style="western"><surname>Digutsch</surname><given-names>J</given-names> </name><name name-style="western"><surname>Kleinsorge</surname><given-names>T</given-names> </name></person-group><article-title>COVID-19 pandemic and personality: agreeable people are more stressed by the feeling of missing</article-title><source>Int J Environ Res Public Health</source><year>2021</year><month>10</month><day>13</day><volume>18</volume><issue>20</issue><fpage>10759</fpage><pub-id pub-id-type="doi">10.3390/ijerph182010759</pub-id><pub-id pub-id-type="medline">34682500</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Argyriou</surname><given-names>E</given-names> </name><name name-style="western"><surname>Um</surname><given-names>M</given-names> </name><name name-style="western"><surname>Carron</surname><given-names>C</given-names> </name><name name-style="western"><surname>Cyders</surname><given-names>MA</given-names> </name></person-group><article-title>Age and impulsive behavior in drug addiction: a review of past research and future directions</article-title><source>Pharmacol Biochem Behav</source><year>2018</year><month>01</month><volume>164</volume><fpage>106</fpage><lpage>117</lpage><pub-id pub-id-type="doi">10.1016/j.pbb.2017.07.013</pub-id><pub-id pub-id-type="medline">28778737</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Smrdu</surname><given-names>M</given-names> </name><name name-style="western"><surname>Kuder</surname><given-names>A</given-names> </name><name name-style="western"><surname>Turk</surname><given-names>E</given-names> </name><name name-style="western"><surname>&#x010C;elik</surname><given-names>T</given-names> </name><name name-style="western"><surname>&#x0160;et</surname><given-names>J</given-names> </name><name name-style="western"><surname>Kralj-Fi&#x0161;er</surname><given-names>S</given-names> </name></person-group><article-title>COVID-19 pandemic and lockdown: associations with personality and stress components</article-title><source>Psychol Rep</source><year>2023</year><month>04</month><volume>126</volume><issue>2</issue><fpage>727</fpage><lpage>758</lpage><pub-id pub-id-type="doi">10.1177/00332941211043451</pub-id><pub-id pub-id-type="medline">34674582</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kashdan</surname><given-names>TB</given-names> </name><name name-style="western"><surname>Vetter</surname><given-names>CJ</given-names> </name><name name-style="western"><surname>Collins</surname><given-names>RL</given-names> </name></person-group><article-title>Substance use in young adults: associations with personality and gender</article-title><source>Addict Behav</source><year>2005</year><month>02</month><volume>30</volume><issue>2</issue><fpage>259</fpage><lpage>269</lpage><pub-id pub-id-type="doi">10.1016/j.addbeh.2004.05.014</pub-id><pub-id pub-id-type="medline">15621397</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Schulz</surname><given-names>N</given-names> </name><name name-style="western"><surname>Murphy</surname><given-names>B</given-names> </name><name name-style="western"><surname>Verona</surname><given-names>E</given-names> </name></person-group><article-title>Gender differences in psychopathy links to drug use</article-title><source>Law Hum Behav</source><year>2016</year><month>04</month><volume>40</volume><issue>2</issue><fpage>159</fpage><lpage>168</lpage><pub-id pub-id-type="doi">10.1037/lhb0000165</pub-id><pub-id pub-id-type="medline">26571339</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Schwartz</surname><given-names>HA</given-names> </name><name name-style="western"><surname>Eichstaedt</surname><given-names>JC</given-names> </name><name name-style="western"><surname>Kern</surname><given-names>ML</given-names> </name><etal/></person-group><article-title>Personality, gender, and age in the language of social media: the open-vocabulary approach</article-title><source>PLoS ONE</source><year>2013</year><volume>8</volume><issue>9</issue><fpage>e73791</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0073791</pub-id><pub-id pub-id-type="medline">24086296</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Aldao</surname><given-names>A</given-names> </name><name name-style="western"><surname>Nolen-Hoeksema</surname><given-names>S</given-names> </name><name name-style="western"><surname>Schweizer</surname><given-names>S</given-names> </name></person-group><article-title>Emotion-regulation strategies across psychopathology: a meta-analytic review</article-title><source>Clin Psychol Rev</source><year>2010</year><month>03</month><volume>30</volume><issue>2</issue><fpage>217</fpage><lpage>237</lpage><pub-id pub-id-type="doi">10.1016/j.cpr.2009.11.004</pub-id><pub-id pub-id-type="medline">20015584</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Roos</surname><given-names>JM</given-names> </name></person-group><article-title>The Intersection of personality traits and social media usage: large-scale representative samples of internet users in Sweden</article-title><source>Psych</source><year>2023</year><volume>5</volume><issue>1</issue><fpage>70</fpage><lpage>79</lpage><pub-id pub-id-type="doi">10.3390/psych5010008</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Seabrook</surname><given-names>EM</given-names> </name><name name-style="western"><surname>Kern</surname><given-names>ML</given-names> </name><name name-style="western"><surname>Rickard</surname><given-names>NS</given-names> </name></person-group><article-title>Social networking sites, depression, and anxiety: a systematic review</article-title><source>JMIR Ment Health</source><year>2016</year><month>11</month><day>23</day><volume>3</volume><issue>4</issue><fpage>e50</fpage><pub-id pub-id-type="doi">10.2196/mental.5842</pub-id><pub-id pub-id-type="medline">27881357</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Oudin</surname><given-names>A</given-names> </name><name name-style="western"><surname>Maatoug</surname><given-names>R</given-names> </name><name name-style="western"><surname>Bourla</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Digital phenotyping: data-driven psychiatry to redefine mental health</article-title><source>J Med Internet Res</source><year>2023</year><month>10</month><day>4</day><volume>25</volume><fpage>e44502</fpage><pub-id pub-id-type="doi">10.2196/44502</pub-id><pub-id pub-id-type="medline">37792430</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>J</given-names> </name><name name-style="western"><surname>Zong</surname><given-names>H</given-names> </name><etal/></person-group><article-title>The comprehensive clinical benefits of digital phenotyping: from broad adoption to full impact</article-title><source>NPJ Digit Med</source><year>2025</year><month>04</month><day>8</day><volume>8</volume><issue>1</issue><fpage>196</fpage><pub-id pub-id-type="doi">10.1038/s41746-025-01602-5</pub-id><pub-id pub-id-type="medline">40195396</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Roos</surname><given-names>JM</given-names> </name><name name-style="western"><surname>Jansson</surname><given-names>M</given-names> </name><name name-style="western"><surname>Bjerkeli</surname><given-names>PJ</given-names> </name></person-group><article-title>Who are the online medication shoppers? A market segmentation of the Swedish welfare state</article-title><source>JTAER</source><year>2024</year><volume>19</volume><issue>1</issue><fpage>526</fpage><lpage>537</lpage><pub-id pub-id-type="doi">10.3390/jtaer19010028</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>von Elm</surname><given-names>E</given-names> </name><name name-style="western"><surname>Altman</surname><given-names>DG</given-names> </name><name name-style="western"><surname>Egger</surname><given-names>M</given-names> </name><name name-style="western"><surname>Pocock</surname><given-names>SJ</given-names> </name><name name-style="western"><surname>G&#x00F8;tzsche</surname><given-names>PC</given-names> </name><name name-style="western"><surname>Vandenbroucke</surname><given-names>JP</given-names> </name></person-group><article-title>The Strengthening the Reporting of Observational Studies in Epidemiology (STROBE) statement: guidelines for reporting observational studies</article-title><source>Lancet</source><year>2007</year><month>10</month><volume>370</volume><issue>9596</issue><fpage>1453</fpage><lpage>1457</lpage><pub-id pub-id-type="doi">10.1016/S0140-6736(07)61602-X</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="web"><article-title>Commonly abused drugs chart</article-title><source>National Institute on Drug Abuse</source><access-date>2025-11-11</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://nida.nih.gov/sites/default/files/cadchart.pdf">https://nida.nih.gov/sites/default/files/cadchart.pdf</ext-link></comment></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Ott</surname><given-names>M</given-names> </name><name name-style="western"><surname>Goyal</surname><given-names>N</given-names> </name><name name-style="western"><surname>Du</surname><given-names>J</given-names> </name><name name-style="western"><surname>Joshi</surname><given-names>M</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>D</given-names> </name><etal/></person-group><article-title>RoBERTa: a robustly optimized BERT pretraining approach</article-title><source>arXiv</source><comment>Preprint posted online on  Jul 26, 2019</comment><pub-id pub-id-type="doi">10.48550/arXiv.1907.11692</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Hale</surname><given-names>S</given-names> </name><name name-style="western"><surname>Adelani</surname><given-names>DI</given-names> </name><etal/></person-group><article-title>Demographic inference and representative population estimates from multilingual social media data</article-title><year>2019</year><month>05</month><day>13</day><conf-name>WWW &#x2019;19</conf-name><conf-date>May 13-17, 2019</conf-date><pub-id pub-id-type="doi">10.1145/3308558.3313684</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Alhuzali</surname><given-names>H</given-names> </name><name name-style="western"><surname>Ananiadou</surname><given-names>S</given-names> </name></person-group><article-title>SpanEmo: casting multi-label emotion classification as span-prediction</article-title><source>Proceedings of the 16th Conference of the European Chapter of the Association for Computational Linguistics</source><pub-id pub-id-type="doi">10.18653/v1/2021.eacl-main.135</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hutto</surname><given-names>C</given-names> </name><name name-style="western"><surname>Gilbert</surname><given-names>E</given-names> </name></person-group><article-title>VADER: a parsimonious rule-based model for sentiment analysis of social media text</article-title><source>ICWSM</source><year>2014</year><volume>8</volume><issue>1</issue><fpage>216</fpage><lpage>225</lpage><pub-id pub-id-type="doi">10.1609/icwsm.v8i1.14550</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Maharjan</surname><given-names>J</given-names> </name><name name-style="western"><surname>Jin</surname><given-names>R</given-names> </name><name name-style="western"><surname>Zhu</surname><given-names>J</given-names> </name><name name-style="western"><surname>Kenne</surname><given-names>D</given-names> </name></person-group><article-title>Do large language models really understand personality?</article-title><source>J Med Internet Res</source><comment>Preprint posted online on 2025</comment><pub-id pub-id-type="doi">10.2196/75347</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Gjurkovi&#x0107;</surname><given-names>M</given-names> </name><name name-style="western"><surname>Karan</surname><given-names>M</given-names> </name><name name-style="western"><surname>Vukojevi&#x0107;</surname><given-names>I</given-names> </name><name name-style="western"><surname>Bo&#x0161;njak</surname><given-names>M</given-names> </name><name name-style="western"><surname>&#x0160;najder</surname><given-names>J</given-names> </name></person-group><article-title>PANDORA talks: personality and demographics on reddit</article-title><source>arXiv</source><comment>Preprint posted online on  Jun 8, 2020</comment><pub-id pub-id-type="doi">10.48550/arXiv.2004.04460</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Grootendorst</surname><given-names>M</given-names> </name></person-group><article-title>BERTopic: neural topic modeling with a class-based TF-IDF procedure</article-title><source>arXiv</source><comment>Preprint posted online on  Mar 11, 2022</comment><pub-id pub-id-type="doi">10.48550/arXiv.2203.05794</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="web"><article-title>OpenAI</article-title><source>GPT-4 technical report</source><year>2023</year><access-date>2025-11-11</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://openai.com/research/gpt-4">https://openai.com/research/gpt-4</ext-link></comment></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Maharjan</surname><given-names>J</given-names> </name><name name-style="western"><surname>Jin</surname><given-names>R</given-names> </name><name name-style="western"><surname>King</surname><given-names>J</given-names> </name><name name-style="western"><surname>Zhu</surname><given-names>J</given-names> </name><name name-style="western"><surname>Kenne</surname><given-names>D</given-names> </name></person-group><article-title>Differential analysis of age, gender, race, sentiment, and emotion in substance use discourse on Twitter during the COVID-19 pandemic: a natural language processing approach</article-title><source>JMIR Infodemiology</source><year>2025</year><month>07</month><day>28</day><volume>5</volume><fpage>e67333</fpage><pub-id pub-id-type="doi">10.2196/67333</pub-id><pub-id pub-id-type="medline">40720823</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hicks</surname><given-names>BM</given-names> </name><name name-style="western"><surname>Schalet</surname><given-names>BD</given-names> </name><name name-style="western"><surname>Malone</surname><given-names>SM</given-names> </name><name name-style="western"><surname>Iacono</surname><given-names>WG</given-names> </name><name name-style="western"><surname>McGue</surname><given-names>M</given-names> </name></person-group><article-title>Psychometric and genetic architecture of substance use disorder and behavioral disinhibition measures for gene association studies</article-title><source>Behav Genet</source><year>2011</year><month>07</month><volume>41</volume><issue>4</issue><fpage>459</fpage><lpage>475</lpage><pub-id pub-id-type="doi">10.1007/s10519-010-9417-2</pub-id><pub-id pub-id-type="medline">21153693</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jacobs</surname><given-names>P</given-names> </name><name name-style="western"><surname>Viechtbauer</surname><given-names>W</given-names> </name></person-group><article-title>Estimation of the biserial correlation and its sampling variance for use in meta-analysis</article-title><source>Res Synth Methods</source><year>2017</year><month>06</month><volume>8</volume><issue>2</issue><fpage>161</fpage><lpage>180</lpage><pub-id pub-id-type="doi">10.1002/jrsm.1218</pub-id><pub-id pub-id-type="medline">27631635</pub-id></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="book"><person-group person-group-type="editor"><name name-style="western"><surname>Eysenck</surname><given-names>HJ</given-names> </name></person-group><source>Experiments with Drugs: Studies in the Relation between Personality, Learning Theory and Drug Action</source><year>2013</year><publisher-name>Elsevier</publisher-name><pub-id pub-id-type="doi">10.1192/bjp.110.466.450-a</pub-id></nlm-citation></ref><ref id="ref44"><label>44</label><nlm-citation citation-type="web"><article-title>Personalitytraitondrugusers</article-title><source>GitHub repository</source><access-date>2025-11-11</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://github.com/JulinaM/PersonalityTraitOnDrugUsers">https://github.com/JulinaM/PersonalityTraitOnDrugUsers</ext-link></comment></nlm-citation></ref><ref id="ref45"><label>45</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Schmitt</surname><given-names>DP</given-names> </name><name name-style="western"><surname>Long</surname><given-names>AE</given-names> </name><name name-style="western"><surname>McPhearson</surname><given-names>A</given-names> </name><name name-style="western"><surname>O&#x2019;Brien</surname><given-names>K</given-names> </name><name name-style="western"><surname>Remmert</surname><given-names>B</given-names> </name><name name-style="western"><surname>Shah</surname><given-names>SH</given-names> </name></person-group><article-title>Personality and gender differences in global perspective</article-title><source>Int J Psychol</source><year>2017</year><month>12</month><volume>52 Suppl 1</volume><issue>Suppl 1</issue><fpage>45</fpage><lpage>56</lpage><pub-id pub-id-type="doi">10.1002/ijop.12265</pub-id><pub-id pub-id-type="medline">27000535</pub-id></nlm-citation></ref><ref id="ref46"><label>46</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Cooper</surname><given-names>ML</given-names> </name><name name-style="western"><surname>Kuntsche</surname><given-names>E</given-names> </name><name name-style="western"><surname>Levitt</surname><given-names>A</given-names> </name><name name-style="western"><surname>Barber</surname><given-names>LL</given-names> </name><name name-style="western"><surname>Wolf</surname><given-names>S</given-names> </name></person-group><article-title>Motivational models of substance use: a review of theory and research on motives for using alcohol, marijuana, and tobacco</article-title><source>The Oxford Handbook of Substance Use and Substance Use Disorders</source><year>2016</year><volume>1</volume><fpage>375</fpage><lpage>421</lpage></nlm-citation></ref><ref id="ref47"><label>47</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kaufman</surname><given-names>SB</given-names> </name><name name-style="western"><surname>Quilty</surname><given-names>LC</given-names> </name><name name-style="western"><surname>Grazioplene</surname><given-names>RG</given-names> </name><etal/></person-group><article-title>Openness to experience and intellect differentially predict creative achievement in the arts and sciences</article-title><source>J Pers</source><year>2016</year><month>04</month><volume>84</volume><issue>2</issue><fpage>248</fpage><lpage>258</lpage><pub-id pub-id-type="doi">10.1111/jopy.12156</pub-id><pub-id pub-id-type="medline">25487993</pub-id></nlm-citation></ref><ref id="ref48"><label>48</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Curtis</surname><given-names>B</given-names> </name><name name-style="western"><surname>Giorgi</surname><given-names>S</given-names> </name><name name-style="western"><surname>Ungar</surname><given-names>L</given-names> </name><etal/></person-group><article-title>AI-based analysis of social media language predicts addiction treatment dropout at 90 days</article-title><source>Neuropsychopharmacology</source><year>2023</year><month>10</month><volume>48</volume><issue>11</issue><fpage>1579</fpage><lpage>1585</lpage><pub-id pub-id-type="doi">10.1038/s41386-023-01585-5</pub-id><pub-id pub-id-type="medline">37095253</pub-id></nlm-citation></ref><ref id="ref49"><label>49</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Peters</surname><given-names>H</given-names> </name><name name-style="western"><surname>Matz</surname><given-names>SC</given-names> </name></person-group><article-title>Large language models can infer psychological dispositions of social media users</article-title><source>PNAS Nexus</source><year>2024</year><month>06</month><volume>3</volume><issue>6</issue><fpage>gae231</fpage><pub-id pub-id-type="doi">10.1093/pnasnexus/pgae231</pub-id><pub-id pub-id-type="medline">38948324</pub-id></nlm-citation></ref><ref id="ref50"><label>50</label><nlm-citation citation-type="web"><source>Reddit</source><year>2024</year><access-date>2025-12-17</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.reddit.com">https://www.reddit.com</ext-link></comment></nlm-citation></ref><ref id="ref51"><label>51</label><nlm-citation citation-type="web"><source>TikTok</source><year>2024</year><access-date>2025-12-17</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.tiktok.com">https://www.tiktok.com</ext-link></comment></nlm-citation></ref><ref id="ref52"><label>52</label><nlm-citation citation-type="web"><source>Facebook</source><year>2024</year><access-date>2025-12-17</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.facebook.com">https://www.facebook.com</ext-link></comment></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Checklist 1</label><p>STROBE Checklist</p><media xlink:href="jmir_v27i1e79454_app1.pdf" xlink:title="PDF File, 109 KB"/></supplementary-material></app-group></back></article>