<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<?covid-19-tdm?>
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v24i10e37258</article-id>
      <article-id pub-id-type="pmid">36219757</article-id>
      <article-id pub-id-type="doi">10.2196/37258</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Sexually Transmitted Disease–Related Reddit Posts During the COVID-19 Pandemic: Latent Dirichlet Allocation Analysis</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Basch</surname>
            <given-names>Corey</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Tsao</surname>
            <given-names>Shu-Feng</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Rovetta</surname>
            <given-names>Alessandro</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes" equal-contrib="yes">
          <name name-style="western">
            <surname>Johnson</surname>
            <given-names>Amy K</given-names>
          </name>
          <degrees>MSW, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>The Potocsnak Family Division of Adolescent and Young Adult Medicine</institution>
            <institution>Ann &#38; Robert H. Lurie Children's Hospital of Chicago</institution>
            <addr-line>225 E Chicago</addr-line>
            <addr-line>Box 161</addr-line>
            <addr-line>Chicago, IL, 60611</addr-line>
            <country>United States</country>
            <phone>1 3122277733</phone>
            <email>akjohnson@luriechildrens.org</email>
          </address>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-4247-455X</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Bhaumik</surname>
            <given-names>Runa</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0553-1340</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Nandi</surname>
            <given-names>Debarghya</given-names>
          </name>
          <degrees>MS</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0246-4602</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Roy</surname>
            <given-names>Abhishikta</given-names>
          </name>
          <degrees>MS</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7924-2261</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Mehta</surname>
            <given-names>Supriya D</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7926-2489</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>The Potocsnak Family Division of Adolescent and Young Adult Medicine</institution>
        <institution>Ann &#38; Robert H. Lurie Children's Hospital of Chicago</institution>
        <addr-line>Chicago, IL</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Feinberg School of Medicine</institution>
        <institution>Northwestern University</institution>
        <addr-line>Chicago, IL</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>School of Public Health</institution>
        <institution>University of Illinois at Chicago</institution>
        <addr-line>Chicago, IL</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Rush University</institution>
        <addr-line>Chicago, IL</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Amy K Johnson <email>akjohnson@luriechildrens.org</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>10</month>
        <year>2022</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>31</day>
        <month>10</month>
        <year>2022</year>
      </pub-date>
      <volume>24</volume>
      <issue>10</issue>
      <elocation-id>e37258</elocation-id>
      <history>
        <date date-type="received">
          <day>12</day>
          <month>2</month>
          <year>2022</year>
        </date>
        <date date-type="rev-request">
          <day>31</day>
          <month>7</month>
          <year>2022</year>
        </date>
        <date date-type="rev-recd">
          <day>1</day>
          <month>9</month>
          <year>2022</year>
        </date>
        <date date-type="accepted">
          <day>20</day>
          <month>9</month>
          <year>2022</year>
        </date>
      </history>
      <copyright-statement>©Amy K Johnson, Runa Bhaumik, Debarghya Nandi, Abhishikta Roy, Supriya D Mehta. Originally published in the Journal of Medical Internet Research (https://www.jmir.org), 31.10.2022.</copyright-statement>
      <copyright-year>2022</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on https://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2022/10/e37258" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Sexually transmitted diseases (STDs) are common and costly, impacting approximately 1 in 5 people annually. Reddit, the sixth most used internet site in the world, is a user-generated social media discussion platform that may be useful in monitoring discussion about STD symptoms and exposure.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study sought to define and identify patterns and insights into STD-related discussions on Reddit over the course of the COVID-19 pandemic.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We extracted posts from Reddit from March 2019 through July 2021. We used a topic modeling method, Latent Dirichlet Allocation, to identify the most common topics discussed in the Reddit posts. We then used word clouds, qualitative topic labeling, and spline regression to characterize the content and distribution of the topics observed.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Our extraction resulted in 24,311 total posts. Latent Dirichlet Allocation topic modeling showed that with 8 topics for each time period, we achieved high coherence values (pre–COVID-19=0.41, prevaccination=0.42, and postvaccination=0.44). Although most topic categories remained the same over time, the relative proportion of topics changed and new topics emerged. Spline regression revealed that some key terms had variability in the percentage of posts that coincided with pre–COVID-19 and post–COVID-19 periods, whereas others were uniform across the study periods.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Our study’s use of Reddit is a novel way to gain insights into STD symptoms experienced, potential exposures, testing decisions, common questions, and behavior patterns (eg, during lockdown periods). For example, reduction in STD screening may result in observed negative health outcomes due to missed cases, which also impacts onward transmission. As Reddit use is anonymous, users may discuss sensitive topics with greater detail and more freely than in clinical encounters. Data from anonymous Reddit posts may be leveraged to enhance the understanding of the distribution of disease and need for targeted outreach or screening programs. This study provides evidence in favor of establishing Reddit as having feasibility and utility to enhance the understanding of sexual behaviors, STD experiences, and needed health engagement with the public.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>infodemiology</kwd>
        <kwd>Latent Dirichlet Allocation</kwd>
        <kwd>natural language processing</kwd>
        <kwd>Reddit</kwd>
        <kwd>sexually transmitted infections</kwd>
        <kwd>surveillance</kwd>
        <kwd>social media</kwd>
        <kwd>COVID-19</kwd>
        <kwd>social media content</kwd>
        <kwd>content analysis</kwd>
        <kwd>health outcome</kwd>
        <kwd>infoveillance</kwd>
        <kwd>health information</kwd>
        <kwd>sexually transmitted disease</kwd>
        <kwd>STD</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>More than 2.5 million cases of chlamydia, gonorrhea, and syphilis were reported in 2019, with sexually transmitted diseases (STD) cases reaching an all-time high for the sixth consecutive year in the United States [<xref ref-type="bibr" rid="ref1">1</xref>]. STDs are common and costly, impacting approximately 1 in 5 people annually and accounting for US $16 billion in annual health care costs [<xref ref-type="bibr" rid="ref2">2</xref>]. New data from the Centers for Disease Control and Prevention demonstrate that during the start of the COVID-19 pandemic (from March to April 2020), reported STD cases dramatically decreased compared to the same time in 2019. At that point, the current cumulative totals for STD cases compared to 2019 were 1% lower for primary and secondary syphilis, 7% lower for gonorrhea, and 14% lower for chlamydia [<xref ref-type="bibr" rid="ref3">3</xref>]. Although case reports were lower for the first part of 2020, cases rebounded later in the year and were on track to surpass 2019 totals [<xref ref-type="bibr" rid="ref3">3</xref>].</p>
      <p>Multiple factors likely contributed to the observed decrease in reported STD cases during the early phases of the COVID-19 pandemic. Restrictions of in-person clinic visits resulted in reduced screening of asymptomatic patients. The Centers for Disease Control and Prevention provided guidance for sexual health services to prioritize patients based on symptoms and risk, along with delaying routine screening until after the emergency response [<xref ref-type="bibr" rid="ref4">4</xref>]. Many health department staff were redeployed from STD tracking to COVID-19 contact tracing and control [<xref ref-type="bibr" rid="ref5">5</xref>]; 57% of disease intervention specialists reported that they were reassigned from STD to COVID-19 services, limiting the workforce available to provide STD prevention, screening, and treatment [<xref ref-type="bibr" rid="ref5">5</xref>]. Finally, national stay-at-home orders were issued during phases of the pandemic that were designed to reduce the spread of COVID-19 but may also have reduced STD transmission by reducing sexual behavior outside of the household, limiting the number of new sexual partners, and restricting sexual networks [<xref ref-type="bibr" rid="ref6">6</xref>].</p>
      <p>Recent estimates indicate that 80% of all internet users report accessing health information on the web [<xref ref-type="bibr" rid="ref7">7</xref>]. As the internet can be accessed anonymously and at any time, users can seek STD information and resources confidentially, which may facilitate more frequent and open disclosure of symptoms and exposure experiences [<xref ref-type="bibr" rid="ref8">8</xref>]. Reddit, the sixth most used internet site in the world, is a user-generated social media discussion platform that may be useful in monitoring discussion about STD symptoms and exposure [<xref ref-type="bibr" rid="ref9">9</xref>]. Reddit is considered one of the most authentic web spaces as there are safeguards against “bot accounts” and rich communication occurs without the barrier of requiring demographic or identifying information to join [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref11">11</xref>]. Prior health research has established that Reddit is an acceptable platform to conduct scientific investigations [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>]. Topic-specific Reddit discussions (subreddits) dedicated to discussing sexual health and STDs may provide valuable insight to exposure, symptoms, testing, and sexual behavior during the COVID-19 pandemic. Prior analyses of Reddit discussion content have been conducted across different diseases and health conditions, including smoking cessation, atopic dermatitis, suicide, and pregnancy [<xref ref-type="bibr" rid="ref10">10</xref>-<xref ref-type="bibr" rid="ref13">13</xref>]. To derive meaningful and replicable information from Reddit discussion content, the complexity of high-volume text data needs numerical structure implemented in an unbiased way. Latent Dirichlet Allocation (LDA) is a natural language processing method that identifies common words and topics in text and allows experts to assess common themes among findings [<xref ref-type="bibr" rid="ref14">14</xref>]. This study sought to define and identify patterns and insights into STD-related discussions on Reddit via LDA over the course of the COVID-19 pandemic. Our team hypothesized that there would be an increase in the volume of STD-related posts on Reddit and the variation of topics during the COVID-19 pandemic compared to the prepandemic period due to behavior changes during the COVID-19 pandemic.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Ethics Approval</title>
        <p>The study protocol was determined to be nonhuman subjects research by the Ann &#38; Robert H. Lurie Children’s Hospital Institutional Review Board (IRB#2022-4964) because of the use of publicly available, nonidentifiable data.</p>
      </sec>
      <sec>
        <title>Data Extraction</title>
        <p>This study used publicly available data from the web-based discussion forum, Reddit. Reddit is an anonymous social media site that is user-generated and discussion-based. The site is organized into “subreddits” that are content-specific. Posts were extracted from 2 subreddits: “STD” (r/STD) and “sexual health”(r/sexualhealth). However, due to the small number of posts in r/sexual health, we only used the subreddit r/STD in our analysis. The <italic>pushshift</italic> Reddit application programming interface was used for searching Reddit comments and submissions [<xref ref-type="bibr" rid="ref15">15</xref>]. Reddit’s official application programming interface (Reddit 2021) was used to collect posts and associated metadata (date) from r/STD and r/sexualhealth from March 2019 to July 2021, resulting in 24,311 posts [<xref ref-type="bibr" rid="ref10">10</xref>]. Only English-language posts were included in the analysis. <xref rid="figure1" ref-type="fig">Figure 1</xref> displays the number of posts that were extracted from each subreddit for the time frames used in the analysis. “Pre–COVID-19” was defined as ranging from March 2019 to February 2020 (8421 posts); “COVID-19, prevaccination” was defined as ranging from April to December 2020 (8169 posts); “COVID-19, postvaccination” was defined as ranging from January to July 2021 (6908 posts); and an inflection period was defined as March 2020 (813 posts). Based on the most current literature, we reasonably supposed the absence of seasonality in sexually transmitted infection (STI) cases [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref17">17</xref>].</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Distribution of volume of posts for study time periods from March 2019 to July 2021, resulting in a total of 24,311 posts.</p>
          </caption>
          <graphic xlink:href="jmir_v24i10e37258_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Data Preprocessing</title>
        <p>Data preprocessing steps were conducted following common approaches in natural language processing [<xref ref-type="bibr" rid="ref18">18</xref>]. Preprocessing eliminates some of the inconsistencies in the data and reduces the content to useable text. In all, 4 preprocessing steps were completed on each line from the text file to extract and clean each title, body, and comment separately: (1) the removal of URLs, (2) tokenization, (3) punctuation and stop word removal, and (4) lemmatization [<xref ref-type="bibr" rid="ref19">19</xref>-<xref ref-type="bibr" rid="ref21">21</xref>].</p>
      </sec>
      <sec>
        <title>Statistical Analysis</title>
        <sec>
          <title>LDA Topic Modeling</title>
          <p>We used an increasingly popular topic modeling method, LDA, to conduct a text analysis identifying the most common topics discussed in the Reddit posts [<xref ref-type="bibr" rid="ref22">22</xref>]. LDA is a statistical generative model that discovers latent semantic topics in large collections of text documents (posts in our study), where each document results from random mixtures over latent topics and each topic is characterized by a distribution over words. The model is presented in plate notation in <xref rid="figure2" ref-type="fig">Figure 2</xref> [<xref ref-type="bibr" rid="ref14">14</xref>]. Both the topics and words have a Dirichlet prior distribution, respectively, with α being the parameter of the per-document Dirichlet prior on the topics, and β being the parameter of the per-word Dirichlet prior on the words.  θ<sub>m</sub> is the topic distribution for document m. ϕ<sub>k</sub> is the word distribution for topic k. Z<sub>nm</sub> is the topic for the nth word in the mth document. W<sub>nm</sub> is the actual nth word in the mth document. Considering the nature of its structure, LDA is a multiple-level hierarchical Bayesian model.</p>
          <p>To conduct the LDA, we converted the corpus to a document-term matrix, comprising rows representing original posts and columns representing each word in the corpus. Each cell in the document-term matrix contains the frequency of times a specific word (defined by the column) occurred in a specific post (defined by the row). From this document-term matrix, the entire corpus was represented, including patterns of words that commonly occur together within the same post. We used the <italic>gensim</italic> library to perform LDA model estimation, which determined sets of words that appeared frequently together in posts across sexual health subreddits [<xref ref-type="bibr" rid="ref19">19</xref>].</p>
          <p>The LDA model then outputs a topic-document matrix, representing the relative importance of each topic in each document. Models were applied to pre–COVID-19 posts from March 2019 to February 2020 (8421 posts), prevaccination posts from April to December 2020 (8169 posts), and postvaccination posts from January to July 2021 (6908 posts; <xref rid="figure3" ref-type="fig">Figure 3</xref>). For topic modeling, we excluded posts for the inflection period (March 2020; 813 posts).</p>
          <p>A key process in LDA is to estimate the optimal number of topics. To estimate the number of topics, we used the topic coherence index, which is the most consistent measure of human interpretability [<xref ref-type="bibr" rid="ref23">23</xref>]. Topic coherence measures score a single topic by measuring the degree of semantic similarity between high-scoring words in the topic. These measurements help distinguish between topics that are semantically interpretable topics and topics that are artifacts of statistical inference. The higher the topic coherence score, the better the quality of the model. To avoid overfit and sparsity and improve inference, we selected the number of topics as 8. Topics were reviewed and labeled independently by 2 experts in STD epidemiology and control (AKJ and SDM). Once independent review was completed, labels were discussed until consensus was reached, resulting in 100% agreement.</p>
          <fig id="figure2" position="float">
            <label>Figure 2</label>
            <caption>
              <p>Latent Dirichlet Allocation in plate notation (adapted from Blei et al [<xref ref-type="bibr" rid="ref14">14</xref>]).</p>
            </caption>
            <graphic xlink:href="jmir_v24i10e37258_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
          <fig id="figure3" position="float">
            <label>Figure 3</label>
            <caption>
              <p>Latent Dirichlet Allocation topic modeling on multiple time periods: (A) pre–COVID-19, (B) prevaccination, and (C) postvaccination.</p>
            </caption>
            <graphic xlink:href="jmir_v24i10e37258_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Word Cloud</title>
          <p>A word cloud is a text visualization technique that focuses on the frequency of words and correlates the size and opacity of a word to its frequency within a text body. The output is usually an image that depicts different words in different sizes and opacities relative to the word frequency. Separate frames were created for posts containing the following terms: chlamydia, gonorrhea, syphilis, gonorrhea/discharge/dysuria, and syphilis/chancre/ulcer. After data preprocessing was completed, each string was passed to the <italic>WordCloud</italic> function in Python to generate a word cloud [<xref ref-type="bibr" rid="ref24">24</xref>]. For <italic>WordCloud</italic> visualization, we chose 3 etiologic terms (chlamydia, gonorrhea, and syphilis) and 3 of the most common terminologies from the topic search: herpes/herpes simplex virus (HSV)/human papillomavirus (HPV; as a single topic, due to correlations), diagnosis/testing, and STI/STD. Each separate word cloud was formed by searching each word in the topic.</p>
        </sec>
        <sec>
          <title>Spline Regression Plots</title>
          <p>Spline regression modeling has become popular in applied clinical research. Modern biostatistics makes use of spline regression to model smooth functions such as time series, cumulative effects, and frequency distributions and in survival analysis. Spline regression is used to overcome the difficulties of linear and polynomial regression algorithms. In linear regression, the entire data set is considered once. Polynomial regression can express a particular amount of curvature in a nonlinear relationship, but in spline regression (a nonparametric regression), the data set is divided into bins. Each bin of the data is fitted with separate models. The points where the data are divided into bins are called knots. In simpler words, splines are piecewise polynomial functions. To identify patterns in the change of the proportion of posts related to certain search terms relative to the total number of posts in a particular month over the entire study period (spanning from March 2019 to July 2021), a spline plot was created. The pre-COVID-19; inflection; COVID-19, prevaccination; and COVID-19, postvaccination periods were highlighted on the plots for a better understanding of search trends across time. The plots were created using <italic>ggplot2</italic> package in R statistical software (R Foundation for Statistical Computing) [<xref ref-type="bibr" rid="ref25">25</xref>]. For spline regression, we used a cubic B-spline basis with 2 boundary knots and 1 interior knot placed at the median of the observed data values. As with the word clouds, we created 3 plots based on etiology (chlamydia, gonorrhea, and syphilis) and 3 plots based on common topics (diagnose/test/tested, herpes/HSV/HPV, and gonorrhea/dysuria/discharge). A detailed review of spline regression using R software can be found in Perperoglou et al [<xref ref-type="bibr" rid="ref26">26</xref>].</p>
        </sec>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Reddit Posts</title>
        <p>Of the 24,311 posts, the average number of posts per month were 701.75 during the pre–COVID-19 period; 907.67 during the COVID-19, prevaccination period; and 863.50 during the COVID-19, postvaccination period, but there was substantial variability from month to month and within each time period. The average number of posts per month per period demonstrated growth in subreddit volume during COVID-19. <xref rid="figure4" ref-type="fig">Figure 4</xref> displays the number of posts per month by observation period. May 2019 consisted of 210 posts and August 2021 consisted of 169 posts, which were 2 of the lowest volumes recorded and were both preceded by 2 months of high-volume posts.</p>
        <p>LDA topic modeling showed that with 8 topics for each time period, we achieved high coherence values (pre–COVID-19=0.41, prevaccination=0.42, and postvaccination=0.44). <xref rid="figure5" ref-type="fig">Figure 5</xref> shows the distribution of topic posts in pre–COVID-19, prevaccination, and postvaccination “STD” and “sexual health” subreddits over the 8 topics extracted using LDA. Although most topic categories remained the same over time, the relative proportion of topics changed and new topics emerged. In the pre–COVID-19 period, a general category of “STD Risk” emerged with no specific etiology or mention of symptoms with words such as “negative” and “exposure” in the top 10 terms associated with the topic (<xref ref-type="table" rid="table1">Table 1</xref>). “HPV” and “warts” as terms did not appear in the pre–COVID-19 period. There was specific language surrounding herpes symptoms (eg, “outbreak”) and diagnosis (eg, testing and positive or negative) and the introduction of “HSV” in the postvaccination period, whereas words used in conjunction with herpes in previous periods were primarily related to images and nonspecific symptoms (eg, “redness” and “bumps”; <xref ref-type="table" rid="table2">Table 2</xref>). Moreover, although the “herpes image” topic category included nonspecific symptoms (eg, “bump” and “redness”), this categorization diverged during COVID-19 periods, with a topic category emerging for penile “bump” without the mention of herpes. In the postvaccination period, the “oral sex/STD questioning” topic included the term “penis”; although this topic existed in the other 2 periods, it did not include “penis” as a top 10 term (<xref ref-type="table" rid="table3">Table 3</xref>).</p>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Average number of Reddit posts per month, by period.</p>
          </caption>
          <graphic xlink:href="jmir_v24i10e37258_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>Distribution of posts: the proportion of documents that are assigned to each topic. STD: sexually transmitted disease; HPV: human papillomavirus.</p>
          </caption>
          <graphic xlink:href="jmir_v24i10e37258_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Pre–COVID-19 topics and the top 10 terms derived from a Latent Dirichlet Allocation model created from 3 different time periods: pre–COVID-19, prevaccination, and postvaccination.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="270"/>
            <col width="730"/>
            <thead>
              <tr valign="top">
                <td>Topic</td>
                <td>Top 10 terms</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Testing, no specific etiology</td>
                <td>day, test, week, negative, feel, take, pain, still, exposure, also</td>
              </tr>
              <tr valign="top">
                <td>Herpes image</td>
                <td>com, imgur, penis, sex, STD<sup>a</sup>, help, really, day, condom, herpes</td>
              </tr>
              <tr valign="top">
                <td>Oral sex/STD questioning</td>
                <td>sex, oral, day, ago, STD, know, condom, unprotected, time, penis</td>
              </tr>
              <tr valign="top">
                <td>Penile “bump”</td>
                <td>com, imgur, bump, look, red, penis, herpes, week, day, spot</td>
              </tr>
              <tr valign="top">
                <td>Diagnosis/doctor (results)</td>
                <td>test, say, back, doctor, look, hepatitis, come, herpes, throat, negative</td>
              </tr>
              <tr valign="top">
                <td>Diagnosis/chlamydia</td>
                <td>test, sex, chlamydia, week, month, symptom, come, back, time, partner</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>STD: sexually transmitted disease.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Prevaccination topics and the top 10 terms derived from a Latent Dirichlet Allocation model created from 3 different time periods: pre–COVID-19, prevaccination, and postvaccination.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="270"/>
            <col width="730"/>
            <thead>
              <tr valign="top">
                <td>Topic</td>
                <td>Top 10 terms</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Oral sex/STD<sup>a</sup> questioning</td>
                <td>sex, oral, come, week, test, day, know, back, STD, time</td>
              </tr>
              <tr valign="top">
                <td>HPV<sup>b</sup>/warts treatment, herpes questioning</td>
                <td>test, sex, HPV, time, year, condom, month, ago, last, say</td>
              </tr>
              <tr valign="top">
                <td>Diagnosis/chlamydia</td>
                <td>test, take, symptom, day, week, know, say, back, chlamydia, doctor</td>
              </tr>
              <tr valign="top">
                <td>Testing, no specific etiology image</td>
                <td>day, month, feel, start, sex, doctor, pain, take, test, thing</td>
              </tr>
              <tr valign="top">
                <td>Diagnosis (results)</td>
                <td>test, positive, negative, sex, chlamydia, result, herpes, partner, day, month</td>
              </tr>
              <tr valign="top">
                <td>Penile “bump” symptom (no pictures, no herpes)</td>
                <td>com, imgur, bump, help, penis, look, know, pimple, hurt, think</td>
              </tr>
              <tr valign="top">
                <td>Herpes image</td>
                <td>imgur, com, herpes, bump, red, penis, help, day, look, month</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>STD: sexually transmitted disease.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>HPV: human papillomavirus.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Postvaccination topics and the top 10 terms derived from a Latent Dirichlet Allocation model created from 3 different time periods: pre–COVID-19, prevaccination, and postvaccination.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="270"/>
            <col width="730"/>
            <thead>
              <tr valign="top">
                <td>Topic</td>
                <td>Top 10 terms</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Herpes symptoms/diagnosis</td>
                <td>test, herpes, HSV<sup>a</sup>, sex, know, outbreak, negative, positive, genital, risk</td>
              </tr>
              <tr valign="top">
                <td>Herpes image</td>
                <td>com, imgur, herpes, sex, look, help, remove, know, oral, bump</td>
              </tr>
              <tr valign="top">
                <td>HPV<sup>b</sup>/warts treatment, herpes questioning</td>
                <td>wart, herpes, ibb_co, com, www_reddit, comment, remove, HPV, month, skin</td>
              </tr>
              <tr valign="top">
                <td>Diagnosis/chlamydia</td>
                <td>day, month, feel, start, sex, doctor, pain, take, test, thing</td>
              </tr>
              <tr valign="top">
                <td>Testing, no specific etiology</td>
                <td>test, remove, STD, day, sex, week, negative, help, time, oral</td>
              </tr>
              <tr valign="top">
                <td>Penile “bump” symptom (no pictures, no herpes)</td>
                <td>penis, bump, sex, day, know, STD<sup>c</sup>, feel, look, condom, time</td>
              </tr>
              <tr valign="top">
                <td>Oral sex/STD questioning</td>
                <td>sex, know, test, week, say, think, time, symptom, oral, tell</td>
              </tr>
              <tr valign="top">
                <td>Penile “bump” symptom</td>
                <td>bump, com, look, imgur, week, ago, day, penis, red, notice</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>HSV: herpes simplex virus.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>HPV: human papillomavirus.</p>
            </fn>
            <fn id="table3fn3">
              <p><sup>c</sup>STD: sexually transmitted disease.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Word Clouds</title>
        <p>Although the terms in the topic models listed above are informative, we used <italic>WordCloud</italic> visualizations to better understand the relative importance of these words within each topic based on etiology and general terms over the study period. The terms that appear larger appeared more frequently within the topic, whereas the terms in smaller font appeared less frequently. <xref rid="figure6" ref-type="fig">Figure 6</xref>A-F displays the word clouds for 6 specific topics; for example, <xref rid="figure6" ref-type="fig">Figure 6</xref>E displays terms clustered with herpes/HSV/HPV such as “imgur” (denoting that a picture was uploaded), “bump,” “pain,” and “outbreak.”</p>
        <fig id="figure6" position="float">
          <label>Figure 6</label>
          <caption>
            <p>Word clouds by key term: (A) syphilis, (B) diagnosis/testing, (C) STI/STD, (D) gonorrhea, (E) herpes/HSV/HPV, and (F) chlamydia. HPV: human papillomavirus; HSV: herpes simplex virus; STD: sexually transmitted disease; STI: sexually transmitted infection.</p>
          </caption>
          <graphic xlink:href="jmir_v24i10e37258_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Spline Regressions</title>
        <p>As shown in the series of spline regressions in <xref rid="figure7" ref-type="fig">Figure 7</xref>A-F, there is some variability in the percentage of posts by key terms over the study periods. Although some regressions are “flat” (ie, uniform) across the study periods, others display variability that coincides with the COVID-19 periods. For example, <xref rid="figure7" ref-type="fig">Figure 7</xref>F displays the regression for posts with the key terms “diagnose/test/tested.” There is some variability in the percentage of posts in the different COVID-19 periods, with the pre–COVID-19 and postvaccination volumes being similar to each other and the prevaccination period having a lower percentage of posts. We tested the significance of the differences between the pre–COVID-19 and post–COVID-19 frequency of posts for 6 key terms (<xref ref-type="table" rid="table4">Table 4</xref>). There are statistically significant differences for herpes and syphilis, with post–COVID-19 frequencies being higher than pre–COVID-19 frequencies.</p>
        <fig id="figure7" position="float">
          <label>Figure 7</label>
          <caption>
            <p>Percentage of Reddit posts containing specific key terms from March 2019 to July 2021: (A) gonorrhea, (B) chlamydia, (C) syphilis, (D) gonorrhea/dysuria/discharge, (E) herpes/HSV/HPV, and (F) diagnose/test/tested. HPV: human papillomavirus; HSV: herpes simplex virus.</p>
          </caption>
          <graphic xlink:href="jmir_v24i10e37258_fig7.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Comparing the differences between the pre–COVID-19 and post-COVID-19 frequencies of posts.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="230"/>
            <col width="270"/>
            <col width="320"/>
            <col width="180"/>
            <thead>
              <tr valign="top">
                <td>Key term</td>
                <td>Pre–COVID-19, frequency</td>
                <td>Post–COVID-19, frequency</td>
                <td><italic>P</italic> value</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Chlamydia</td>
                <td>35.27</td>
                <td>43.47</td>
                <td>.08</td>
              </tr>
              <tr valign="top">
                <td>Gonorrhea</td>
                <td>14.25</td>
                <td>15.56</td>
                <td>.64</td>
              </tr>
              <tr valign="top">
                <td>Herpes</td>
                <td>118.75</td>
                <td>160.47</td>
                <td>.01</td>
              </tr>
              <tr valign="top">
                <td>Syphilis</td>
                <td>12.92</td>
                <td>21.23</td>
                <td>.005</td>
              </tr>
              <tr valign="top">
                <td>Test/diagnosis</td>
                <td>78</td>
                <td>97.65</td>
                <td>.08</td>
              </tr>
              <tr valign="top">
                <td>Gonorrhea/dysuria</td>
                <td>25.33</td>
                <td>30.47</td>
                <td>.28</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>Our study provides evidence that there was an increase in the volume of STD-related posts during the COVID-19 pandemic periods and there were changes in the topics posted in STD-related subreddits from pre–COVID-19 through COVID-19, prevaccination and COVID-19, postvaccination periods. The changes in topics discussed likely relate to behavior changes due to COVID-19–related lockdowns, restrictions on in-person gatherings, and the closing of nonessential medical services [<xref ref-type="bibr" rid="ref27">27</xref>]. Regardless of lockdown status, people still engage in sexual behavior (eg, condomless sex) that will expose them to STDs. However, with the reduction of STD testing or treatment, these cases are not reflected in surveillance numbers. It is important to understand the sexual health experiences of communities, including symptoms, questions, and behavior patterns, to plan for screening and treatment options.</p>
        <p>Our results found that “STD risk” as a topic and general “risk” terms as words only appeared in the pre–COVID-19 time period, whereas “HPV” and “warts” only appeared in the COVID-19, prevaccination and postvaccination periods. During the pre–COVID-19 time period, users generated posts related to general STD risk and sexual behavior, seeking advice and support for understanding STD exposure risk for specific sexual behavior or partnership choices. During the 2 COVID-19 periods, this general “STD risk” topic no longer appeared, demonstrating a difference in content—moving from general discussions to specific symptom or etiology-based posts. During the 2 COVID-19 periods, HPV/warts emerged as a topic. This finding may be due to increased effort to self-diagnosis symptoms experienced as a result of limited access to diagnostic services. Although reported STD cases declined during the initial lockdown period, cases reported in 2020 quickly rebounded and exceed the case numbers in 2019 [<xref ref-type="bibr" rid="ref3">3</xref>].</p>
        <p>Our study’s use of Reddit is a novel way to gain insights into STD symptoms experienced, potential exposures, testing decisions, common questions, and behavior patterns (eg, during lockdown periods). For example, reduction in STD screening may result in observed negative health outcomes due to missed cases, which also impacts onward transmission. The reduction in access to STD testing and treatment during COVID-19 intensified existing barriers to sexual health care, including stigma, judgement, cost, and accessibility [<xref ref-type="bibr" rid="ref28">28</xref>]. It is important that STD services be maintained, either through telehealth and in-home testing options or via clinic services with COVID-19 mitigation procedures in place (screening, masking, and social distancing).</p>
        <p>As Reddit use is anonymous, users may discuss sensitive topics with greater detail and more freely than in clinical encounters. The sexual health subreddits had an average volume of unique posts ranging from approximately 700 to 900 per month; thus, Reddit is a frequently used source of information that could guide the understanding of the behavior, symptoms, and common questions of patients. Sexual health care workers should consider collaboration with Reddit or other social media outlets to leverage the potential benefits of these platforms (anonymous, free, and rapid response) while mitigating harm (incorrect diagnoses and faulty recommendations) [<xref ref-type="bibr" rid="ref29">29</xref>].</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>Study results should be interpreted while considering the following limitations. LDA is an unsupervised approach with no gold standard to compare to. However, we analyzed the LDA output qualitatively with the use of 2 independent coders and reached 100% consensus on manual topic labels. As we used posts from an open web-based forum, we were unable to validate users; however, there is little incentive to be dishonest or to post false information on health-related subreddits. Reddit users tend to be younger and are more likely to be male compared to the larger US population; however, other demographic trends (eg, race/ethnicity) mirror the distribution in the United States [<xref ref-type="bibr" rid="ref30">30</xref>]. As men and Black or African American and Latino communities are often underrepresented in STI case data, it is important to gain an understanding of their sexual health needs and experiences via alternative data sources [<xref ref-type="bibr" rid="ref30">30</xref>]. Finally, the precise location of Reddit users are unknown. Although we were able to extract posts limited to the United States and those in the English language, we cannot pinpoint post volume by specific state or local jurisdiction.</p>
      </sec>
      <sec>
        <title>Conclusion</title>
        <p>This study demonstrates Reddit as having feasibility and utility to enhance the understanding of sexual behaviors, STD experiences, and needed health engagement with the public. It is important to prioritize efforts to reduce the spread and impact of STDs through surveillance, screening, and treatment. The COVID-19 pandemic and subsequent stay-at-home orders highlight a critical need for increased access to STD clinics and STD information. Data from anonymous Reddit posts may be leveraged to enhance the understanding of the distribution of disease and need for targeted outreach or screening programs.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">HPV</term>
          <def>
            <p>human papillomavirus</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">HSV</term>
          <def>
            <p>herpes simplex virus</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">LDA</term>
          <def>
            <p>Latent Dirichlet Allocation</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">STD</term>
          <def>
            <p>sexually transmitted disease</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">STI</term>
          <def>
            <p>sexually transmitted infection</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="web">
          <article-title>Sexually Transmitted Disease Surveillance 2019</article-title>
          <source>Centers for Disease Control and Prevention</source>
          <access-date>2022-10-07</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cdc.gov/std/statistics/2019/">https://www.cdc.gov/std/statistics/2019/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="web">
          <article-title>Sexually transmitted infections prevalence, incidence, and cost estimates in the United States</article-title>
          <source>Centers for Disease Control and Prevention</source>
          <year>2021</year>
          <month>02</month>
          <day>18</day>
          <access-date>2022-10-07</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cdc.gov/std/statistics/prevalence-incidence-cost-2020.htm">https://www.cdc.gov/std/statistics/prevalence-incidence-cost-2020.htm</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pagaoa</surname>
              <given-names>Melissa</given-names>
            </name>
            <name name-style="western">
              <surname>Grey</surname>
              <given-names>Jeremy</given-names>
            </name>
            <name name-style="western">
              <surname>Torrone</surname>
              <given-names>Elizabeth</given-names>
            </name>
            <name name-style="western">
              <surname>Kreisel</surname>
              <given-names>Kristen</given-names>
            </name>
            <name name-style="western">
              <surname>Stenger</surname>
              <given-names>Mark</given-names>
            </name>
            <name name-style="western">
              <surname>Weinstock</surname>
              <given-names>Hillard</given-names>
            </name>
          </person-group>
          <article-title>Trends in nationally notifiable sexually transmitted disease case reports during the US COVID-19 pandemic, January to December 2020</article-title>
          <source>Sex Transm Dis</source>
          <year>2021</year>
          <month>10</month>
          <day>01</day>
          <volume>48</volume>
          <issue>10</issue>
          <fpage>798</fpage>
          <lpage>804</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34224523"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/OLQ.0000000000001506</pub-id>
          <pub-id pub-id-type="medline">34224523</pub-id>
          <pub-id pub-id-type="pii">00007435-900000000-97626</pub-id>
          <pub-id pub-id-type="pmcid">PMC8459909</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bachmann</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Thorpe</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Bolan</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Mermin</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>STD treatment options</article-title>
          <source>Centers for Disease Control and Prevention</source>
          <year>2020</year>
          <month>04</month>
          <day>06</day>
          <access-date>2022-10-07</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cdc.gov/nchhstp/dear_colleague/2020/dcl-040620-std-treatment-options.html">https://www.cdc.gov/nchhstp/dear_colleague/2020/dcl-040620-std-treatment-options.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="web">
          <article-title>COVID-19 and the state of the STD field</article-title>
          <source>National Coalition of STD Directors</source>
          <year>2020</year>
          <month>05</month>
          <day>12</day>
          <access-date>2022-10-07</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ncsddc.org/resource/covid-19-and-the-state-of-the-std-field/">https://www.ncsddc.org/resource/covid-19-and-the-state-of-the-std-field/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rushmore</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Copen</surname>
              <given-names>CE</given-names>
            </name>
            <name name-style="western">
              <surname>Schneider</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lamuda</surname>
              <given-names>PS</given-names>
            </name>
            <name name-style="western">
              <surname>Taylor</surname>
              <given-names>BG</given-names>
            </name>
            <name name-style="western">
              <surname>Kirkcaldy</surname>
              <given-names>RD</given-names>
            </name>
            <name name-style="western">
              <surname>Bernstein</surname>
              <given-names>KT</given-names>
            </name>
          </person-group>
          <article-title>Partner seeking and sexual behavior in the United States during the COVID-19 pandemic, March 2020 to March 2021</article-title>
          <source>Sexual Trans Dis</source>
          <year>2021</year>
          <month>11</month>
          <day>12</day>
          <volume>49</volume>
          <issue>4</issue>
          <fpage>e57</fpage>
          <lpage>e60</lpage>
          <pub-id pub-id-type="doi">10.1097/olq.0000000000001582</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fox</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Dugan</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Health online 2013</article-title>
          <source>Pew Research Center</source>
          <year>2013</year>
          <month>01</month>
          <day>15</day>
          <access-date>2022-10-07</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.pewresearch.org/internet/2013/01/15/health-online-2013/">https://www.pewresearch.org/internet/2013/01/15/health-online-2013/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>AK</given-names>
            </name>
            <name name-style="western">
              <surname>Mikati</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Mehta</surname>
              <given-names>SD</given-names>
            </name>
          </person-group>
          <article-title>Examining the themes of STD-related Internet searches to increase specificity of disease forecasting using internet search terms</article-title>
          <source>Sci Rep</source>
          <year>2016</year>
          <month>11</month>
          <day>09</day>
          <volume>6</volume>
          <fpage>36503</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/srep36503"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/srep36503</pub-id>
          <pub-id pub-id-type="medline">27827386</pub-id>
          <pub-id pub-id-type="pii">srep36503</pub-id>
          <pub-id pub-id-type="pmcid">PMC5101501</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Anderson</surname>
              <given-names>KE</given-names>
            </name>
          </person-group>
          <article-title>Ask me anything: what is Reddit?</article-title>
          <source>Library Hi Tech News</source>
          <year>2015</year>
          <month>07</month>
          <day>06</day>
          <volume>32</volume>
          <issue>5</issue>
          <fpage>8</fpage>
          <lpage>11</lpage>
          <pub-id pub-id-type="doi">10.1108/lhtn-03-2015-0018</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Silberman</surname>
              <given-names>WR</given-names>
            </name>
            <name name-style="western">
              <surname>Record</surname>
              <given-names>RA</given-names>
            </name>
          </person-group>
          <article-title>We post it, U Reddit: exploring the potential of reddit for health interventions targeting college populations</article-title>
          <source>J Health Commun</source>
          <year>2021</year>
          <month>06</month>
          <day>03</day>
          <volume>26</volume>
          <issue>6</issue>
          <fpage>381</fpage>
          <lpage>390</lpage>
          <pub-id pub-id-type="doi">10.1080/10810730.2021.1949648</pub-id>
          <pub-id pub-id-type="medline">34260329</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kurtti</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Jagedo</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Analysis of Reddit reveals dupilumab questions among atopic dermatitis patients</article-title>
          <source>J Drugs Dermatol</source>
          <year>2022</year>
          <month>03</month>
          <day>01</day>
          <volume>21</volume>
          <issue>3</issue>
          <fpage>292</fpage>
          <lpage>294</lpage>
          <pub-id pub-id-type="doi">10.36849/JDD.5942</pub-id>
          <pub-id pub-id-type="medline">35254758</pub-id>
          <pub-id pub-id-type="pii">S1545961622P0292X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pilkington</surname>
              <given-names>PD</given-names>
            </name>
            <name name-style="western">
              <surname>Bedford-Dyer</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Mothers' worries during pregnancy: a content analysis of Reddit posts</article-title>
          <source>J Perinat Educ</source>
          <year>2021</year>
          <month>04</month>
          <day>01</day>
          <volume>30</volume>
          <issue>2</issue>
          <fpage>98</fpage>
          <lpage>107</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33897234"/>
          </comment>
          <pub-id pub-id-type="doi">10.1891/J-PE-D-20-00018</pub-id>
          <pub-id pub-id-type="medline">33897234</pub-id>
          <pub-id pub-id-type="pii">jpe.30.2.98</pub-id>
          <pub-id pub-id-type="pmcid">PMC8061722</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mason</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Jang</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Morley</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Scarf</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Collings</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Riordan</surname>
              <given-names>BC</given-names>
            </name>
          </person-group>
          <article-title>A content analysis of Reddit users' perspectives on reasons for not following through with a suicide attempt</article-title>
          <source>Cyberpsychol Behav Soc Netw</source>
          <year>2021</year>
          <month>10</month>
          <volume>24</volume>
          <issue>10</issue>
          <fpage>642</fpage>
          <lpage>647</lpage>
          <pub-id pub-id-type="doi">10.1089/cyber.2020.0521</pub-id>
          <pub-id pub-id-type="medline">33601950</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Blei</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Ng</surname>
              <given-names>AY</given-names>
            </name>
            <name name-style="western">
              <surname>Jordan</surname>
              <given-names>MI</given-names>
            </name>
          </person-group>
          <article-title>Latent dirichlet allocation</article-title>
          <source>J Mach Learn Res</source>
          <year>2003</year>
          <month>03</month>
          <day>01</day>
          <volume>3</volume>
          <fpage>993</fpage>
          <lpage>1022</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmlr.org/papers/volume3/blei03a/blei03a.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Baumgartner</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zannettou</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Keegan</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Squire</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Blackburn</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>The pushshift Reddit dataset</article-title>
          <year>2020</year>
          <month>05</month>
          <day>26</day>
          <conf-name>Fourteenth International AAAI Conference on Web and Social Media (ICWSM-20)</conf-name>
          <conf-date>June 8-11, 2019</conf-date>
          <conf-loc>Atlanta, GA</conf-loc>
          <fpage>830</fpage>
          <lpage>839</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ojs.aaai.org/index.php/ICWSM/article/view/7347"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mohseni</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Benard</surname>
              <given-names>RB</given-names>
            </name>
            <name name-style="western">
              <surname>Mead-Harvey</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Mi</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Lindor</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Sheele</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>Sexually transmitted infections in the emergency department are not associated with holidays or school breaks</article-title>
          <source>Am J Emerg Med</source>
          <year>2021</year>
          <month>07</month>
          <volume>45</volume>
          <fpage>642</fpage>
          <lpage>644</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ajem.2020.11.020</pub-id>
          <pub-id pub-id-type="medline">33246859</pub-id>
          <pub-id pub-id-type="pii">S0735-6757(20)31028-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>AP</given-names>
            </name>
            <name name-style="western">
              <surname>Smolensky</surname>
              <given-names>MH</given-names>
            </name>
            <name name-style="western">
              <surname>Burau</surname>
              <given-names>KD</given-names>
            </name>
            <name name-style="western">
              <surname>Cech</surname>
              <given-names>IM</given-names>
            </name>
            <name name-style="western">
              <surname>Lai</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Recent change in the annual pattern of sexually transmitted diseases in the United States</article-title>
          <source>Chronobiol Int</source>
          <year>2007</year>
          <volume>24</volume>
          <issue>5</issue>
          <fpage>947</fpage>
          <lpage>60</lpage>
          <pub-id pub-id-type="doi">10.1080/07420520701648325</pub-id>
          <pub-id pub-id-type="medline">17994348</pub-id>
          <pub-id pub-id-type="pii">783648416</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vijayarani</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ilamathi</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Nithya</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Preprocessing techniques for text mining - an overview</article-title>
          <source>International Journal of Computer Science &#38; Communication Networks</source>
          <year>2015</year>
          <volume>5</volume>
          <issue>1</issue>
          <fpage>7</fpage>
          <lpage>16</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.ttcenter.ir/ArticleFiles/ENARTICLE/3783.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Řehůřek</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Sojka</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Gensim–python framework for vector space modelling</article-title>
          <source>NLP Centre, Faculty of Informatics, Masaryk University, Brno, Czech Republic</source>
          <year>2011</year>
          <volume>3</volume>
          <issue>2</issue>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Loper</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Bird</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>NLTK: the natural language toolkit</article-title>
          <source>Association for Computational Linguistics</source>
          <year>2002</year>
          <month>07</month>
          <day>07</day>
          <conf-name>ETMTNLP '02: ACL-02 Workshop on Effective tools and methodologies for teaching natural language processing and computational linguistics</conf-name>
          <conf-date>July 7, 2002</conf-date>
          <conf-loc>Philadelphia, PA</conf-loc>
          <fpage>63</fpage>
          <lpage>70</lpage>
          <pub-id pub-id-type="doi">10.3115/1118108.1118117</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Honnibal</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Montani</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Natural language understanding with Bloom embeddings, convolutional neural networks and incremental parsing. Unpublished software application</article-title>
          <source>spaCy</source>
          <year>2017</year>
          <access-date>2022-10-07</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://spacy.io">https://spacy.io</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Blei</surname>
              <given-names>DM</given-names>
            </name>
          </person-group>
          <article-title>Collaborative topic modeling for recommending scientific articles</article-title>
          <year>2011</year>
          <month>08</month>
          <day>21</day>
          <conf-name>KDD '11: 17th ACM SIGKDD international conference on Knowledge discovery and data mining</conf-name>
          <conf-date>August 21-24, 2011</conf-date>
          <conf-loc>San Diego, CA</conf-loc>
          <fpage>448</fpage>
          <lpage>456</lpage>
          <pub-id pub-id-type="doi">10.1145/2020408.2020480</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Röder</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Both</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hinneburg</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Exploring the space of topic coherence measures</article-title>
          <year>2015</year>
          <month>02</month>
          <day>02</day>
          <conf-name>WSDM '15: Eighth ACM International Conference on Web Search and Data Mining</conf-name>
          <conf-date>February 2-6, 2015</conf-date>
          <conf-loc>Shanghai, China</conf-loc>
          <fpage>399</fpage>
          <lpage>408</lpage>
          <pub-id pub-id-type="doi">10.1145/2684822.2685324</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mueller</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>wordcloud 1.8.2.2</article-title>
          <source>Python Package Index</source>
          <year>2013</year>
          <access-date>2021-11-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://pypi.python.org/pypi/wordcloud">https://pypi.python.org/pypi/wordcloud</ext-link>
            <ext-link ext-link-type="webcite" xlink:href="6oD8n8hqa"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wickham</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <source>ggplot2: Elegant Graphics for Data Analysis</source>
          <year>2016</year>
          <publisher-loc>Cham, Switzerland</publisher-loc>
          <publisher-name>Springer</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Perperoglou</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sauerbrei</surname>
              <given-names>Willi</given-names>
            </name>
            <name name-style="western">
              <surname>Abrahamowicz</surname>
              <given-names>Michal</given-names>
            </name>
            <name name-style="western">
              <surname>Schmid</surname>
              <given-names>Matthias</given-names>
            </name>
          </person-group>
          <article-title>A review of spline function procedures in R</article-title>
          <source>BMC Med Res Methodol</source>
          <year>2019</year>
          <month>03</month>
          <day>06</day>
          <volume>19</volume>
          <issue>1</issue>
          <fpage>46</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedresmethodol.biomedcentral.com/articles/10.1186/s12874-019-0666-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12874-019-0666-3</pub-id>
          <pub-id pub-id-type="medline">30841848</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12874-019-0666-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC6402144</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nagendra</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Carnevale</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Neu</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Cohall</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Zucker</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>The potential impact and availability of sexual health services during the COVID-19 pandemic</article-title>
          <source>Sex Transm Dis</source>
          <year>2020</year>
          <month>07</month>
          <volume>47</volume>
          <issue>7</issue>
          <fpage>434</fpage>
          <lpage>436</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32520878"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/OLQ.0000000000001198</pub-id>
          <pub-id pub-id-type="medline">32520878</pub-id>
          <pub-id pub-id-type="pii">00007435-202007000-00003</pub-id>
          <pub-id pub-id-type="pmcid">PMC7448722</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Napoleon</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Maynard</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Almonte</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Silva</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Toma</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Chu</surname>
              <given-names>CT</given-names>
            </name>
            <name name-style="western">
              <surname>Cormier</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Strong</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chan</surname>
              <given-names>PA</given-names>
            </name>
          </person-group>
          <article-title>Impact of the COVID-19 pandemic on sexually transmitted infection clinic visits</article-title>
          <source>Sex Transm Dis</source>
          <year>2021</year>
          <month>01</month>
          <volume>48</volume>
          <issue>1</issue>
          <fpage>e5</fpage>
          <lpage>e7</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33181578"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/OLQ.0000000000001306</pub-id>
          <pub-id pub-id-type="medline">33181578</pub-id>
          <pub-id pub-id-type="pii">00007435-202101000-00013</pub-id>
          <pub-id pub-id-type="pmcid">PMC7736141</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nobles</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Leas</surname>
              <given-names>EC</given-names>
            </name>
            <name name-style="western">
              <surname>Althouse</surname>
              <given-names>BM</given-names>
            </name>
            <name name-style="western">
              <surname>Dredze</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Longhurst</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Ayers</surname>
              <given-names>JW</given-names>
            </name>
          </person-group>
          <article-title>Requests for diagnoses of sexually transmitted diseases on a social media platform</article-title>
          <source>JAMA</source>
          <year>2019</year>
          <month>11</month>
          <day>05</day>
          <volume>322</volume>
          <issue>17</issue>
          <fpage>1712</fpage>
          <lpage>1713</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31688875"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jama.2019.14390</pub-id>
          <pub-id pub-id-type="medline">31688875</pub-id>
          <pub-id pub-id-type="pii">2753884</pub-id>
          <pub-id pub-id-type="pmcid">PMC6865226</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sattelberg</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>The demographics Of Reddit: who uses the site?</article-title>
          <source>Alphr</source>
          <year>2021</year>
          <month>04</month>
          <day>06</day>
          <access-date>2021-11-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.alphr.com/demographics-reddit/#:~:text=According%20to%20data%20collected%20in,percent%20were%2065%20or%20older">https://www.alphr.com/demographics-reddit/#:~:text=According%20to%20data%20collected%20in,percent%20were%2065%20or%20older</ext-link>
          </comment>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
