<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v21i8e14077</article-id>
      <article-id pub-id-type="pmid">31452514</article-id>
      <article-id pub-id-type="doi">10.2196/14077</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Stroke Survivors on Twitter: Sentiment and Topic Analysis From a Gender Perspective</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Gore</surname>
            <given-names>Ross</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Subirats</surname>
            <given-names>Laia</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Kiritchenko</surname>
            <given-names>Svetlana</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Garcia-Rudolph</surname>
            <given-names>Alejandro</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Institut Guttmann Hospital de Neurorehabilitacio</institution>
            <addr-line>Camí de Can Ruti, s / n</addr-line>
            <addr-line>Badalona, 08916</addr-line>
            <country>Spain</country>
            <phone>34 934977700</phone>
            <email>alejandropablogarcia@gmail.com</email>
          </address>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-0853-8334</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Laxe</surname>
            <given-names>Sara</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-3688-8825</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Saurí</surname>
            <given-names>Joan</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-0572-0459</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Bernabeu Guitart</surname>
            <given-names>Montserrat</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-2037-3069</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Institut Guttmann Hospital de Neurorehabilitacio</institution>
        <addr-line>Badalona</addr-line>
        <country>Spain</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Universitat Autònoma de Barcelona</institution>
        <addr-line>Bellaterra (Cerdanyola del Vallès)</addr-line>
        <country>Spain</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Fundació Institut d’Investigació en Ciències de la Salut Germans Trias i Pujol</institution>
        <addr-line>Badalona</addr-line>
        <country>Spain</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Alejandro Garcia-Rudolph 
        <email>alejandropablogarcia@gmail.com</email></corresp>
      </author-notes>
      <pub-date pub-type="collection"><month>08</month><year>2019</year></pub-date>
      <pub-date pub-type="epub">
        <day>26</day>
        <month>08</month>
        <year>2019</year>
      </pub-date>
      <volume>21</volume>
      <issue>8</issue>
      <elocation-id>e14077</elocation-id>
      <history>
        <date date-type="received">
          <day>23</day>
          <month>3</month>
          <year>2019</year>
        </date>
        <date date-type="rev-request">
          <day>18</day>
          <month>4</month>
          <year>2019</year>
        </date>
        <date date-type="rev-recd">
          <day>11</day>
          <month>6</month>
          <year>2019</year>
        </date>
        <date date-type="accepted">
          <day>16</day>
          <month>6</month>
          <year>2019</year>
        </date>
      </history>
      <copyright-statement>©Alejandro Garcia-Rudolph, Sara Laxe, Joan Saurí, Montserrat Bernabeu Guitart. Originally published in the Journal of Medical Internet Research (http://www.jmir.org), 26.08.2019.</copyright-statement>
      <copyright-year>2019</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on http://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="http://www.jmir.org/2019/8/e14077/" xlink:type="simple"/>
      <abstract>
        <sec sec-type="Background">
          <title>Background</title>
          <p>Stroke is the worldwide leading cause of long-term disabilities. Women experience more activity limitations, worse health-related quality of life, and more poststroke depression than men. Twitter is increasingly used by individuals to broadcast their day-to-day happenings, providing unobtrusive access to samples of spontaneously expressed opinions on all types of topics and emotions.</p>
        </sec>
        <sec sec-type="Objective">
          <title>Objective</title>
          <p>This study aimed to consider the raw frequencies of words in the collection of tweets posted by a sample of stroke survivors and to compare the posts by gender of the survivor for 8 basic emotions (anger, fear, anticipation, surprise, joy, sadness, trust and disgust); determine the proportion of each emotion in the collection of tweets and statistically compare each of them by gender of the survivor; extract the main topics (represented as sets of words) that occur in the collection of tweets, relative to each gender; and assign happiness scores to tweets and topics (using a well-established tool) and compare them by gender of the survivor.</p>
        </sec>
        <sec sec-type="Methods">
          <title>Methods</title>
          <p>We performed sentiment analysis based on a state-of-the-art lexicon (National Research Council) with <italic>syuzhet</italic> R package. The emotion scores for men and women were first subjected to an F-test and then to a Wilcoxon rank sum test. We extended the emotional analysis, assigning happiness scores with the hedonometer (a tool specifically designed considering Twitter inputs). We calculated daily happiness average scores for all tweets. We created a term map for an exploratory clustering analysis using VosViewer software. We performed structural topic modelling with <italic>stm</italic> R package, allowing us to identify main topics by gender. We assigned happiness scores to all the words defining the main identified topics and compared them by gender.</p>
        </sec>
        <sec sec-type="Results">
          <title>Results</title>
          <p>We analyzed 800,424 tweets posted from August 1, 2007 to December 1, 2018, by 479 stroke survivors: Women (n=244) posted 396,898 tweets, and men (n=235) posted 403,526 tweets. The stroke survivor condition and gender as well as membership in at least 3 stroke-specific Twitter lists of active users were manually verified for all 479 participants. Their total number of tweets since 2007 was 5,257,433; therefore, we analyzed the most recent 15.2% of all their tweets. Positive emotions (anticipation, trust, and joy) were significantly higher (<italic>P</italic>&lt;.001) in women, while negative emotions (disgust, fear, and sadness) were significantly higher (<italic>P</italic>&lt;.001) in men in the analysis of raw frequencies and proportion of emotions. Happiness mean scores throughout the considered period show higher levels of happiness in women. We calculated the top 20 topics (with percentages and CIs) more likely addressed by gender and found that women’s topics show higher levels of happiness scores.</p>
        </sec>
        <sec sec-type="Conclusions">
          <title>Conclusions</title>
          <p>We applied two different approaches—the Plutchik model and hedonometer tool—to a sample of stroke survivors’ tweets. We conclude that women express positive emotions and happiness much more than men.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>stroke</kwd>
        <kwd>emotions</kwd>
        <kwd>Twitter</kwd>
        <kwd>infodemiology</kwd>
        <kwd>infoveillance</kwd>
        <kwd>sentiment analysis</kwd>
        <kwd>topic models</kwd>
        <kwd>gender</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>General Background</title>
        <p>Tweets can contain information about the mood of their authors. Even when users are not specifically posting about their personal emotive status, the message can reflect their mood. As such, tweets are regarded as microscopic instantiations of emotions. Twitter has been extensively analyzed for health-related conditions. Nevertheless, to the best of our knowledge, no study has been conducted in chronic stroke, with a focus on the emotional aspects and topics addressed by stroke survivors.</p>
      </sec>
      <sec>
        <title>Stroke in Young Adults</title>
        <p>Stroke is the third leading cause of long-term disability and one of the leading causes of depression worldwide [<xref ref-type="bibr" rid="ref1">1</xref>]. Evidence suggests that stroke incidence in young adults is increasing in high-income countries [<xref ref-type="bibr" rid="ref2">2</xref>]. It has been recently reported that ischemic stroke is no longer a disease affecting just elderly people, and an estimated 3.6 million young people (age&lt;55 years) are affected each year [<xref ref-type="bibr" rid="ref3">3</xref>]. The burden of stroke in young people may be increasing further, since multiple recent studies have reported increasing incidence of ischemic strokes, particularly at younger ages, while the incidence at older ages has been declining during the same period [<xref ref-type="bibr" rid="ref4">4</xref>].</p>
        <p>Globally, almost half of the entire stroke burden is on young individuals, as they have a greater likelihood to survive strokes, with long life spans ahead, and because strokes occur at younger ages in low- and middle-income countries [<xref ref-type="bibr" rid="ref5">5</xref>]. Moreover, the overall population burden of cerebrovascular disease in young people may be underestimated, since clinically silent infarcts and white-matter changes are prevalent even in young stroke patients [<xref ref-type="bibr" rid="ref6">6</xref>].</p>
        <p>About one-fourth of ischemic strokes occur in working-aged individuals in high-income countries, with the incidence increasing worldwide in this age group from the 1980s to present [<xref ref-type="bibr" rid="ref3">3</xref>].</p>
      </sec>
      <sec>
        <title>Gender Differences in Stroke Outcomes</title>
        <p>After experiencing a stroke, women experience more activity limitations, worse health-related quality of life (HRQoL), and more poststroke depression than men, as recently reported in an updated systematic review of sex differences [<xref ref-type="bibr" rid="ref7">7</xref>].</p>
        <p>Recent research published in January 2019 in the European Journal of Neurology reported that women are twice as likely as men to suffer from severe depression following a stroke. Ayis and colleagues [<xref ref-type="bibr" rid="ref8">8</xref>] followed the progression of symptoms over 5 years after stroke onset in 2313 people (1275 men and 1038 women) from the South London Stroke Register and found that 20% of women suffered from severe depression compared to 10% of men [<xref ref-type="bibr" rid="ref8">8</xref>].</p>
        <p>The higher prevalence of depression among women may reflect a higher prevalence in the general population, where depression was identified as the leading cause of disease burden in women worldwide [<xref ref-type="bibr" rid="ref9">9</xref>].</p>
      </sec>
      <sec>
        <title>#Stroke</title>
        <p>The expansion of social media has changed the way in which patients, physicians, and other health care stakeholders interact [<xref ref-type="bibr" rid="ref10">10</xref>]. Twitter has led to the development of disease-specific communities that can categorize and aggregate their interactions using “hashtags.” These Twitter communities serve as readily accessible, no-cost platforms that provide significant educational and professional benefits.</p>
        <p>Within stroke medicine, social media, specifically Twitter, has been recently highlighted for its potential to benefit patients, stroke organizations, and medical education [<xref ref-type="bibr" rid="ref11">11</xref>].</p>
        <p>The stroke-related Twitter network has been recently studied [<xref ref-type="bibr" rid="ref12">12</xref>], through 621,653 tweets containing the #Stroke hashtag from March 20, 2012, to January 31, 2018, in relation to tweet content, activity metrics, engagement, and user characteristics. The most commonly discussed topics were prevention, diabetes, atrial fibrillation, aphasia, dementia, thrombectomy devices, thrombolysis, and tobacco. Specifically, the content of discussions included recognition of the signs of a stroke, associated risk factors (eg, atrial fibrillation, heart disease, and diabetes), and findings of peer-reviewed journals regarding stroke treatment. Tweets were mainly composed by advocacy/support organizations (21.5%), physicians (8.4%), individuals not known to be directly working in the health care industry (14.0%), other health care professionals (5.5%), organizations related to research/academia (2.3%), and academics (2.2%), while stroke patients contributed to 6.7% of tweets (n=41,822). There was a similar proportion of total tweets with the #Stroke hashtag generated by physicians (8.4%) and patients (6.7%) during the study period and apparent minimal network communication between physicians and patients, as reported in the study conclusions [<xref ref-type="bibr" rid="ref12">12</xref>].</p>
      </sec>
      <sec>
        <title>Emotional Distress in the Adjustment Process for Stroke Survivors</title>
        <p>Brennan emphasizes the importance of assumptions in adapting to the world around us. According to Brennan’s model, we each have a cognitive map or representation of the world, resulting from our social and cultural context and the accumulation of our life experience. This highly complex “assumptive world” is biologically adaptive in that it allows us to anticipate and plan for the future [<xref ref-type="bibr" rid="ref13">13</xref>].</p>
        <p>In the case of a typical stroke patient, their assumptive world will almost always be challenged or disconfirmed by the experience of stroke and its immediate repercussions [<xref ref-type="bibr" rid="ref14">14</xref>]. As Brennan states, “adjusting core assumptions involves huge amounts of cognitive processing and emotional distress, this often leads to acute emotional difficulties, such as feelings of confusion, loss, sadness and anger.”</p>
        <p>Moreover, the experience of stroke and disability may also confirm previously held negative beliefs for some individuals (eg, “I am worthless” or “Others see me as weak”) and may lead to emotional distress in this manner [<xref ref-type="bibr" rid="ref14">14</xref>].</p>
      </sec>
      <sec>
        <title>Spontaneous, Emotional Language, and Everyday Topic Discussions on Twitter</title>
        <p>Over the last few years, Twitter has become a notable data source in sociolinguistics, as it captures opinions and sentiments on a wide range of topics. Although Twitter users are a self-selected group, it has been argued that analyses of Twitter data produce results congruent with those obtained using standard research methods and data sources [<xref ref-type="bibr" rid="ref15">15</xref>].</p>
        <p>Considering the frequent use of emotional language in tweets that relate to everyday experiences [<xref ref-type="bibr" rid="ref16">16</xref>], for a large proportion of the population, Twitter provides unobtrusive access to time-sensitive and ecologically valid samples of spontaneously expressed emotions [<xref ref-type="bibr" rid="ref17">17</xref>].</p>
        <p>Sentiment analysis in the health care setting is not a new phenomenon; for example, in previous research, greater positive sentiment within discharge summaries was associated with a significantly decreased risk of readmission [<xref ref-type="bibr" rid="ref18">18</xref>].</p>
      </sec>
      <sec>
        <title>This Study</title>
        <p>In the following subsections, we describe the specific characteristics and objectives of our study.</p>
        <sec>
          <title>Twitter Lists</title>
          <p>Previous studies have shown that topical experts are often the primary drivers of interesting discussions on Twitter [<xref ref-type="bibr" rid="ref19">19</xref>]. In contrast to random sampling for gathering Twitter data, alternative sampling methods have been put forward; one of them proposed to retrieve content only from topical experts, that is, Twitter users whose followers consider them to be knowledgeable on some topic, to reduce the number of unwanted tweets in the sampled data while still gathering useful tweets related to a specific topic. The key challenge, however, lies in identifying a good set of experts [<xref ref-type="bibr" rid="ref20">20</xref>].</p>
          <p>Twitter users can organize the accounts that they follow into Twitter user lists. These lists are used in a variety of ways. In some cases, they may correspond to personal lists of a given user’s friends and families, but frequently, lists are employed to group together Twitter accounts based on a common topic or theme. In this way, every Twitter user can effectively become a community curator. Therefore, previous research has proposed that we consider a Twitter user a “topical expert” if the user belongs to several lists on a particular topic [<xref ref-type="bibr" rid="ref20">20</xref>].</p>
          <p>In our study, we propose to take advantage of user lists in the field of stroke. To the best of our knowledge, lists have not been used in studies related to chronic health conditions.</p>
        </sec>
        <sec>
          <title>Plutchik’s Human Emotions</title>
          <p>Currently, there is no single accepted psychological theory of basic human emotions; nevertheless, there is an agreement that a simple positive-negative dichotomy is not enough to capture the full range of emotions [<xref ref-type="bibr" rid="ref21">21</xref>].</p>
          <p>In this work, we use the Plutchik [<xref ref-type="bibr" rid="ref22">22</xref>] approach, which postulates the following eight basic human emotions: joy, sadness, anger, fear, trust, disgust, anticipation, and surprise. There have been extensive applications of this approach, for example, the National Research Council (NRC) Word-Emotion Association Lexicon, which contains 10,170 lexical items that are coded for Plutchik’s basic human emotions [<xref ref-type="bibr" rid="ref23">23</xref>], and has been applied in several sentiment analysis studies [<xref ref-type="bibr" rid="ref24">24</xref>].</p>
          <p>Plutchik’s categories also have the advantage of providing a balanced list of positive (trust, joy, surprise, and anticipation) and negative (disgust, sadness, fear, and anger) emotions, which, to the best of our knowledge, have not been applied in chronic conditions, in general, or stroke, in particular.</p>
        </sec>
      </sec>
      <sec>
        <title>Hedonometer</title>
        <p>After performing emotional analysis based on Plutchik’s model, we propose another point of view, by assigning happiness scores to tweets with the hedonometer tool. The hedonometer [<xref ref-type="bibr" rid="ref25">25</xref>] was developed from Twitter, Google Books, music lyrics, and the New York Times for measuring expressed happiness—positive and negative sentiment—in large-scale text corpora. Since its development, the hedonometer has been applied to studies on predictive markers of depression on Instagram [<xref ref-type="bibr" rid="ref26">26</xref>] or the climate change sentiment on Twitter [<xref ref-type="bibr" rid="ref27">27</xref>]. The hedonometer calculates a happiness score based on the happiness of the individual words used in the text. A total of 10,222 of the most frequently used English words in four disparate corpora were given happiness ratings using Amazon’s Mechanical Turk online marketplace.</p>
      </sec>
      <sec>
        <title>Adding Covariate Information With Structural Topic Models</title>
        <p>Although Latent Dirichlet Allocation (LDA) is, perhaps, the most common form of topic modeling, a number of associated techniques now exist, including dynamic topic models, correlated topic models, and hierarchical topic models. One of the techniques that has become increasingly popular in recent years, however, is structural topic modeling (STM). STM provides a flexible way to incorporate “metadata” associated with the text, such as when the text was written, where (eg, which country) it was written, who wrote it, and characteristics of the author, into the analysis using document-level covariates. In turn, it allows analysis of relationships between metadata and topics in the text corpus.</p>
      </sec>
      <sec>
        <title>Study Objectives</title>
        <p>As Brennan states [<xref ref-type="bibr" rid="ref13">13</xref>], the adjusting process involves huge amounts of emotional distress. This often leads to acute emotional difficulties such as feelings of confusion, loss, sadness, and anger. Considering that women experience more activity limitations, worse health-related quality of life, and more poststroke depression, in this study, we propose to take advantage of unobtrusive access to samples of spontaneously expressed emotions and opinions provided by Twitter and to analyze them from a gender perspective using two different, well-established approaches (Plutchik model and the hedonometer tool), with the following specific aims:</p>
        <list list-type="bullet">
          <list-item>
            <p>To compare tweets by gender of stroke survivor for the 8 basic emotions (anger, fear, anticipation, surprise, joy, sadness, trust, and disgust) while considering the raw frequencies of words in the collection of tweets posted by a sample of stroke survivors.</p>
          </list-item>
          <list-item>
            <p>To determine the proportion of each emotion in the collection of tweets and statistically compare each of them by gender. This measurement thus allows us to track the proportion of each emotion for each individual tweet and is less affected by single outliers.</p>
          </list-item>
          <list-item>
            <p>To extract the main topics (represented as sets of words) that occur in the collection of tweets, related to each gender.</p>
          </list-item>
          <list-item>
            <p>To assign happiness scores to tweets and topics (using the hedonometer) and compare them by gender.</p>
          </list-item>
        </list>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Data Collection</title>
        <p>We considered the network analysis from previous research [<xref ref-type="bibr" rid="ref12">12</xref>] (see #Stroke in the Introduction) as the starting point. Node size is related to user influence, which is directly correlated to the amount a user is mentioned. The top identified nodes and their corresponding number of followers are as follows: @TheStrokeAssoc (102 million), @signagnststroke (68 million), @StrokeHope (93.8 million), @PeterCoghlan1 (7.2 million), @strokefdn (11.5 million), @StrokeAssocNW (5.5 million), @StrokeAHA_ASA (10.6 million), and @HeartandStroke (45.3 million).</p>
        <p>Twitter data collection was performed using the <italic>rtweet</italic> R package [<xref ref-type="bibr" rid="ref28">28</xref>] via Twitter's REST (representational state transfer) and stream application program interfaces (APIs). We initially applied the <italic>lists_users</italic> function to obtain all lists that the top nodes subscribe to, including their own. Subsequently, we used the <italic>lists_members</italic> function to obtain Twitter list members (users on a given list). To retain a list member, we imposed the condition that it should appear in at least 3 different lists.</p>
        <p>For each identified user, we retrieved tweets with the get_timelines() function (it retrieves the most recent 3200 tweets for each Twitter user, without any time restriction). We collected 1,300,845 tweets from a thousand users and further classified them into tweets from individuals (women or men) and from organizations (institutions and associations); the last step was to collect only tweets from individuals where the gender could be clearly determined, as explained in the next section.</p>
      </sec>
      <sec>
        <title>Participant Selection Process</title>
        <p>We modeled our data collection methods on prior studies that have used the Twitter platform for generating a convenience sample of users with publicly available accounts, who self-identify as stroke survivors in their profile or tweets.</p>
        <p>We then confirmed the self-reported stroke diagnosis by having one researcher generate this initial list of Twitter users and a second researcher check the details for each Twitter user on the list to ensure correct identification of stroke survivor users.</p>
        <p>We then employed a stepwise process for coding each Twitter user’s gender as male, female, or unknown/insufficient data. Two researchers independently used these codes, beginning with each Twitter user’s username, followed by profile name, profile description, profile photo, and tweets. Both researchers then reviewed their final gender codes for each Twitter user to ensure consistency and resolve disagreements.</p>
      </sec>
      <sec>
        <title>Data Cleaning</title>
        <p>The final sample was prepared for analysis by using the <italic>quanteda</italic> R package. This included the process of basic normalization (eg, remove punctuation and lowercase all text), stop word removal (eg, the words “a” and “the”), normalization of Twitter user mentions (eg, “@janedoe” is converted to “@user”), lemmatization (eg, “dog,” “dogs,” and “dog’s” are all converted to “dog”), and nonprintable character removal (eg, emojis). All analyses relied on public, anonymized data; adhered to the terms and conditions, terms of use, and privacy policies of Twitter; and were performed under Institutional Review Board approval from the authors’ institution.</p>
        <p>We do not report any specific tweets that could be used to identify the original Twitter user who posted the content online, as this is an important concern that has been discussed extensively in recent literature on the ethics of using Twitter data for research [<xref ref-type="bibr" rid="ref29">29</xref>].</p>
      </sec>
      <sec>
        <title>Sentiment Analysis</title>
        <p>We calculated the overall frequencies of emotion words for each Plutchik category for each user (and therefore gender) by using the <italic>syuzhet</italic> R package [<xref ref-type="bibr" rid="ref30">30</xref>]. The NRC Word-Emotion Association Lexicon is available via open access and has been implemented in the get_nrc_sentiment() function of the <italic>syuzhet</italic> R package. Finally, the data were subjected to statistical analyses: For each tweet, given an emotion X, an emotion proportion score was calculated as:</p>
        <disp-formula><italic>proportion<sub>X</sub> = frequency of words with emotion X in a tweet / (frequency of negative words in a tweet + frequency of positive words in a tweet) (equation 1)</italic></disp-formula>
        <p>The emotion proportion scores for men and women were then subjected to a Wilcoxon rank sum test in R, since the <italic>F</italic>-test had revealed that the two distributions did not meet the criterion of variance homogeneity [<xref ref-type="bibr" rid="ref31">31</xref>].</p>
      </sec>
      <sec>
        <title>Structural Topic Models</title>
        <p>Considering the final sample of tweets from the data cleaning phase presented above as the starting point, we proceeded as follows:</p>
        <list list-type="order">
          <list-item>
            <p>Convert cleaned tweets to tm corpus and create a term document matrix (TDM) using the <italic>tm</italic> R Package [<xref ref-type="bibr" rid="ref32">32</xref>].</p>
          </list-item>
          <list-item>
            <p>Calculate the term frequency inverse document frequency (TF-IDF) for all the words in TDM.</p>
          </list-item>
          <list-item>
            <p>Exclude all the words with TF-IDF≤0.1 to remove all the words that are less frequent.</p>
          </list-item>
          <list-item>
            <p>Calculate the optimal number of topics (K) in the corpus using the log-likelihood method for the calculated TDM using Gibbs sampling and exploring different metrics: “Griffiths2004,” “CaoJuan2009,” “Arun2010,” and “Deveaud2014” using the <italic>FindTopicsNumber</italic> function from the <italic>ldatuning</italic> R package [<xref ref-type="bibr" rid="ref33">33</xref>].</p>
          </list-item>
          <list-item>
            <p>Apply the spectral method using the <italic>stm</italic> package to discover topics.</p>
          </list-item>
          <list-item>
            <p>Topic validation (semantic coherence and exclusivity).</p>
          </list-item>
          <list-item>
            <p>Visualization and interpretation of results from the calculated model.</p>
          </list-item>
        </list>
        <p>A unique feature of STM, implemented by the <italic>stm</italic> R package [<xref ref-type="bibr" rid="ref34">34</xref>], is that it can model how the document level covariates affect the topical prevalence parameter μ with a generalized linear model. As mentioned in the Sentiment Analysis section above, our covariate is the gender factor with two levels (“Woman” and “Man”).</p>
        <p>Besides the inclusion of the gender covariate, the <italic>stm</italic> R package supports the explicit estimation of correlations among topics. This feature provides further information on the corpus structure. Correlations are estimated by replacing the Dirichlet distribution in the standard LDA framework with a logistic normal distribution as in the Correlated Topic Model [<xref ref-type="bibr" rid="ref35">35</xref>].</p>
        <p>This allows us to identify when two topics are likely to cooccur within tweets (here, we focus on both positive and negative correlations, which are also useful to identify gender differences).</p>
      </sec>
      <sec>
        <title>Hedonometer</title>
        <p>We applied the hedonometer tool to all tweets and to the main identified topics as follows: For each word in each tweet, we obtained a happiness score, calculated the mean happiness score for each day, and plotted it by date grouping by gender; STM allows us to identify the main topics and label the topics as “More likely Women” and “More likely Men.” As each topic is defined by a set of words, we obtained the happiness score of each word using the hedonometer, and therefore, we are able to compare topics according to their happiness score. This also allows us to select, for example, the top 25 words with the highest levels of happiness and identify if such words belong to female or male topics.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Sample Description</title>
        <p>After the selection process, a final sample of 479 Twitter users, who posted 800,424 tweets between August 1, 2007, and December 1, 2018, was selected. Women (n=244) posted a total of 3,788,069 tweets; from them, we collected 396,898 tweets (the most recent ones, up to December 2018), and the mean number of tweets posted by our selected sample was 1620. In addition, 54% of the selected sample posted more than 1000 tweets and 71% posted more than 500 tweets. The total number of followers of the selected sample was 182,807.</p>
        <p>Men (n=235) posted a total of 1,469,364 tweets, from which we collected 403,526 tweets (the most recent ones, up to December 2018), and the mean number of tweets posted by our selected sample was 1717. In addition, 59% of the selected sample posted more than 1000 tweets and 73% posted more than 500 tweets. The total number of followers of the selected sample was 255,053.</p>
        <p><xref ref-type="fig" rid="figure1">Figure 1</xref> shows the date of the first and last posted tweets for each selected participant included in our sample (women in red, men in blue; same code colors throughout the analysis). Each vertical line in the plot represents a participant whose first tweet was posted at the top of the vertical line and last tweet was posted at the bottom of it. We ordered participants in the plot from left to right, where the earliest date of the first tweet is shown leftmost for each participant. For example, the leftmost participant is a man whose first tweet was posted in 2007 and last tweet was posted in 2014.</p>
        <fig id="figure1" position="float">
          <caption>
            <p>Dates of the first and last posted tweets for each selected participant (women in red, men in blue).</p>
          </caption>
          <graphic xlink:href="jmir_v21i8e14077_fig1.png" alt-version="no" position="float" xlink:type="simple"/>
        </fig>
        <p>In <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>, we present the number of tweets posted by year; a larger number of tweets was posted in 2018 (about 300,000) and the other 500,000 posts were distributed with growing tendency since 2007, as presented in previous research (described in the #Stroke section).</p>
        <p>For each of the 479 participants, we reviewed their profiles to verify their geographic locations, obtained by means of the <italic>rtweet</italic> library. We were able to identify the geographic locations of 378 of the 479 users (78.91%).</p>
        <p>In <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>, we present the total number of users (N=378) by country, showing that most of the users are from four countries: 95% are from Australia, Canada, the United Kingdom, or the United States.</p>
        <p>The United States had the most users (206/378; 55%). The United Kingdom had 113 users (29.89%). As such, both countries together accounted for approximately 84% of the participants (319/378).</p>
        <p>In <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>, we present wordclouds of the top 500 words in all participants’ profile descriptions. Most words are repeated in both wordclouds, but some distinctive characteristics can be observed (women clearly refer to Music, Live, and Time, while men do not).</p>
      </sec>
      <sec>
        <title>Sentiment Analysis</title>
        <p>The NRC Word-Emotion Association Lexicon, which contains 10,170 lexical items that are coded for Plutchik’s basic human emotions [<xref ref-type="bibr" rid="ref23">23</xref>] and implemented in the <italic>syuzhet</italic> R package, associates an emotion (or more than one emotion) to each of the 10,170 lexical items. Given a word and emotion X, the NRC Word-Emotion Association Lexicon associates a score (range: 0 to 1) with it. A score of 1 indicates that the word conveys the highest amount of emotion X. A score of 0 indicates that the word conveys the lowest amount of emotion X.</p>
        <p>We then identified (via the get_nrc_sentiment() function) the number of words that, according to the NRC, express positive or negative sentiment as well as one (or more than one) of Plutchik’s eight basic emotions.</p>
        <p><xref ref-type="table" rid="table1">Table 1</xref> summarizes the raw number of words (and their percentages) obtained with the get_nrc_sentiment() function of the <italic>syuzhet</italic> R package.</p>
        <p>Among both men and women, the most frequent emotions were trust, anticipation, and joy (top 3), as shown in <xref ref-type="fig" rid="figure2">Figure 2</xref>.</p>
        <p>Women used considerably more words from all positive categories (except anger), and men used more words in all negative categories (except surprise), as shown in <xref ref-type="table" rid="table1">Table 1</xref>.</p>
        <p>When considering negative or positive words, women used 12% of negative words, while men used 13.6% of negative words. In contrast, women used 21.8% of positive words, while men used 20.5% of positive words. Positive and negative labels for words are also obtained from the NRC lexicon using the get_nrc_sentiment() function of the <italic>syuzhet</italic> R package.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Raw frequencies of words identified for each emotion.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="350"/>
            <col width="350"/>
            <col width="300"/>
            <thead>
              <tr valign="top">
                <td>Emotion</td>
                <td>Men, n (%)</td>
                <td>Women, n (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Anger</td>
                <td>76,650 (5.7)</td>
                <td>74,858 (5.4)</td>
              </tr>
              <tr valign="top">
                <td>Anticipation</td>
                <td>155,608 (11.6)</td>
                <td>166,150 (12.0)</td>
              </tr>
              <tr valign="top">
                <td>Disgust</td>
                <td>55,512 (4.1)</td>
                <td>54,785 (4.0)</td>
              </tr>
              <tr valign="top">
                <td>Fear</td>
                <td>117,221 (8.7)</td>
                <td>104,826 (7.6)</td>
              </tr>
              <tr valign="top">
                <td>Joy</td>
                <td>131,243 (9.8)</td>
                <td>161,933 (11.7)</td>
              </tr>
              <tr valign="top">
                <td>Sadness</td>
                <td>101,475 (7.6)</td>
                <td>89,868 (6.5)</td>
              </tr>
              <tr valign="top">
                <td>Surprise</td>
                <td>77,109 (5.7)</td>
                <td>83,663 (6.1)</td>
              </tr>
              <tr valign="top">
                <td>Trust</td>
                <td>170,176 (12.7)</td>
                <td>178,718 (12.9)</td>
              </tr>
              <tr valign="top">
                <td>Negative</td>
                <td>182,288 (13.6)</td>
                <td>166,000 (12.0)</td>
              </tr>
              <tr valign="top">
                <td>Positive</td>
                <td>276,124 (20.5)</td>
                <td>300,751 (21.8)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>Not applicable.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>N/A: not applicable.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <fig id="figure2" position="float">
          <caption>
            <p>Ranking of emotions (in percentage of the total words. Men: left; women: right). Each bar represents the percentage of total words presented in <xref ref-type="table" rid="table1">Table 1</xref>.</p>
          </caption>
          <graphic xlink:href="jmir_v21i8e14077_fig2.png" alt-version="no" position="float" xlink:type="simple"/>
        </fig>
        <p>We then calculated the emotion proportion score for each emotion X, as shown in equation 1 in the Methods section.</p>
        <p><xref ref-type="table" rid="table2">Table 2</xref> reports statistical comparisons; for example, for the global positive emotion, women (median=100%, mean=65.57%) used considerably more positive words than men (median=66.67%, mean=60.73%). Since the <italic>F</italic>-test indicated that the two distributions have a significantly different variance (<italic>F</italic><sub>237040,242190</sub>=1.0468, <italic>P</italic>&lt;.001), they were subjected to a Wilcoxon rank sum test. This test showed that the difference between men and women is highly statistically significant (W=2.6817e+10, <italic>P</italic>&lt;.001). Similar results are shown in <xref ref-type="table" rid="table2">Table 2</xref> for global negative emotion: Men used considerably more negative words than women; in addition, each individual positive emotion (joy, anticipation, and trust, except surprise) was favorable to women and each individual negative emotion (fear, sadness, and disgust) was preferred by men.</p>
        <p>Global negative-positive proportion comparisons are presented in <xref ref-type="fig" rid="figure3">Figure 3</xref>. Women used considerably fewer negative words and more positive words than men (shown at the top and bottom of <xref ref-type="fig" rid="figure3">Figure 3</xref>, respectively).</p>
        <p>Plutchik’s eight emotions are subdivided into four complementary pairs, namely, joy–sadness, anticipation–surprise, trust–disgust, and anger–fear [<xref ref-type="bibr" rid="ref23">23</xref>].</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Statistical comparison of words identified for each emotion.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="190"/>
            <col width="120"/>
            <col width="120"/>
            <col width="220"/>
            <col width="100"/>
            <col width="120"/>
            <col width="100"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Emotion, participants</td>
                <td>Median</td>
                <td>Mean</td>
                <td><italic>F (df)</italic></td>
                <td><italic>P</italic> value</td>
                <td>W</td>
                <td><italic>P</italic> value</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="4">
                  <bold>Joy</bold>
                </td>
                <td>0.9030 (237040,242190)</td>
                <td>&lt;.001</td>
                <td>2.63e+10</td>
                <td>&lt;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Men</td>
                <td>0</td>
                <td>0.2972</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Women</td>
                <td>0</td>
                <td>0.3611</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Negative</bold>
                </td>
                <td>1.0468 (237040,242190)</td>
                <td>&lt;.001</td>
                <td>3.05e+10</td>
                <td>&lt;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Men</td>
                <td>0.3333</td>
                <td>0.3927</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Women</td>
                <td>0</td>
                <td>0.3443</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Fear</bold>
                </td>
                <td>1.1183 (237040,242190)</td>
                <td>&lt;.001</td>
                <td>3.01e+10</td>
                <td>&lt;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Men</td>
                <td>0</td>
                <td>0.2481</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Women</td>
                <td>0</td>
                <td>0.2121</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Positive</bold>
                </td>
                <td>1.0468 (237040,242190)</td>
                <td>&lt;.001</td>
                <td>2.68e+10</td>
                <td>&lt;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Men</td>
                <td>0.6667</td>
                <td>0.6073</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Women</td>
                <td>1.0000</td>
                <td>0.6557</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Sadness</bold>
                </td>
                <td>1.0261 (237040,242190)</td>
                <td>&lt;.001</td>
                <td>2.45e+10</td>
                <td>&lt;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Men</td>
                <td>0</td>
                <td>0.2204</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Women</td>
                <td>0</td>
                <td>0.1868</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Anger</bold>
                </td>
                <td>1.0399 (237040,242190)</td>
                <td>&lt;.001</td>
                <td>2.90e+10</td>
                <td>&lt;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Men</td>
                <td>0</td>
                <td>0.1573</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Women</td>
                <td>0</td>
                <td>0.1495</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Anticipation</bold>
                </td>
                <td>0.9837 (237040,242190)</td>
                <td>&lt;.001</td>
                <td>2.79e+10</td>
                <td>&lt;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Men</td>
                <td>0</td>
                <td>0.3299</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Women</td>
                <td>0</td>
                <td>0.3488</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Surprise</bold>
                </td>
                <td>1 (237040,242190)</td>
                <td>&gt;.99</td>
                <td>N/A<sup>b</sup></td>
                <td>N/A</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Men</td>
                <td>0</td>
                <td>0.1672</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Women</td>
                <td>0</td>
                <td>0.1779</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Trust</bold>
                </td>
                <td>1.0134 (237040,242190)</td>
                <td>&lt;.001</td>
                <td>2.81e+10</td>
                <td>&lt;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Men</td>
                <td>0.1667</td>
                <td>0.3628</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Women</td>
                <td>0.2500</td>
                <td>0.3755</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Disgust</bold>
                </td>
                <td>1.0559 (237040,242190)</td>
                <td>&lt;.001</td>
                <td>2.88e+10</td>
                <td>&lt;.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Men</td>
                <td>0</td>
                <td>0.1153</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Women</td>
                <td>0</td>
                <td>0.1109</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
                <td>—</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <fig id="figure3" position="float">
          <caption>
            <p>Global negative (top) and positive (bottom) emotion proportion comparisons between men and women.</p>
          </caption>
          <graphic xlink:href="jmir_v21i8e14077_fig3.png" alt-version="no" position="float" xlink:type="simple"/>
        </fig>
        <p><xref ref-type="fig" rid="figure4">Figure 4</xref> plots such scores for each emotion summarized monthly along all the time periods in the study of emotion words for each pair of emotions, obtained with <italic>syuzhet</italic> R package and plotted with the <italic>ggplot2</italic> R package. It clearly shows higher scores for women in positive emotions along time and lower scores for men in almost every emotion throughout the considered period.</p>
        <p>As shown in <xref ref-type="fig" rid="figure4">Figure 4</xref>, joy and global positive words clearly present higher values for women throughout the considered period.</p>
        <fig id="figure4" position="float">
          <caption>
            <p>Monthly mean scores for NRC emotions in the 2008-2018 period.</p>
          </caption>
          <graphic xlink:href="jmir_v21i8e14077_fig4.png" alt-version="no" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Assigning Happiness Scores With the Hedonometer</title>
        <p>We then calculated the happiness score using the hedonometer for each word in each tweet, summarized the mean happiness score for each day during the whole period under study, and plotted it by date, grouping by gender.</p>
        <p>As shown in <xref ref-type="fig" rid="figure5">Figure 5</xref>, happiness ratings obtained by hedonometer summarized on a daily basis for each user are also higher for women than for men, almost throughout the considered time period, with remarkable differences in favor of women, for example, in the 2013-2014 period, 2016, and 2018.</p>
        <fig id="figure5" position="float">
          <caption>
            <p>Daily mean happiness scores obtained with the hedonometer, grouped by gender.</p>
          </caption>
          <graphic xlink:href="jmir_v21i8e14077_fig5.png" alt-version="no" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Structural Topic Modeling</title>
        <p>Before the application of STM, we performed an exploratory cluster analysis using VosViewer [<xref ref-type="bibr" rid="ref36">36</xref>]. As defined by VosViewer, a term map is a two-dimensional representation, in which strongly related terms are located close to each other and less strongly related terms are located further away from each other. Each point in a term map has a color that depends on the density of items at that point. It is argued that the VOS mapping technique yields more satisfactory term maps than popular multidimensional scaling–based approaches to bibliometric mapping. Maps constructed using these multidimensional scaling–based approaches are shown to suffer from certain artifacts. Maps constructed using the VOS mapping technique do not have this problem, as reported by Waltman et al [<xref ref-type="bibr" rid="ref36">36</xref>]. Details are presented in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> (VosViewer Cluster Analysis).</p>
        <p>We tested different parameter configurations to increase intercluster distances and reduce intracluster distances. VosViewer allowed us to identify seven clusters for men and five clusters for women (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). In the obtained clusters for the most relevant 250 words for men and women, we highlighted words that are common to clusters obtained by men and women. Unfortunately, this is the case for most of the words; therefore, it did not allow us to visually identify gender differences.</p>
        <p>Nevertheless, in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>, we present the clusters for the words that are not common to both men and women, and we applied the hedonometer to each of them; the happiness scores are shown in brackets for each word.</p>
        <p>We summarized the happiness scores and obtained mean happiness scores of 5.31 (SD 1.31) for all the words present only in men clusters and 6.25 (SD 1.07) for those present only in women clusters. We then considered each of the largest clusters separately and obtained the following for men: mean happiness score in cluster 1=5.52 (SD 0.99) and mean happiness score in cluster 2=5.06 (SD 1.25). For women, the mean happiness score was 6.30 (SD 1.12) in cluster 1, 5.70 (SD 1.13) in cluster 2, and 6.68 (SD 0.81) in cluster 3. Again, happiness scores of women were higher than those of men when considering the scores at the cluster level.</p>
        <p>Before STM, we also performed LDA analysis for seven topics; the number of topics was determined as shown in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> by using different metrics and the FindTopicsNumber function from the <italic>ldatuning</italic> R package.</p>
        <p>The obtained topics are presented in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>, but as with cluster analysis, we could not identify topics clearly related to men or women.</p>
        <p>Therefore, we applied STM to associate covariates (Gender) to the identified topics and plot results as presented in <xref rid="figure6" ref-type="fig">Figure 6</xref>. As with most topic models, the objective function maximized by STM is multimodal. Therefore, the way we choose the starting values for the variational EM algorithm can affect our final solution.</p>
        <fig id="figure6" position="float">
          <caption>
            <p>Topics and gender covariate obtained with spectral structural topic modeling.</p>
          </caption>
          <graphic xlink:href="jmir_v21i8e14077_fig6.png" alt-version="no" position="float" xlink:type="simple"/>
        </fig>
        <p>We applied LDA initialization (the default option), which uses several passes of collapsed Gibbs sampling to initialize the algorithm.</p>
        <p><xref ref-type="table" rid="table3">Table 3</xref> shows the top three topics selected for men and women, with 3 different types of word profiles: highest probability, frequency-exclusivity (FREX), and score values. Detailed descriptions of all identified topics are presented in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p>
        <p>FREX measures exclusivity of the words to the topic in a way that balances it with word frequency. The score metric divides the log frequency of the word in the topic by the log frequency of the word in other topics, and highest probability considers words within each topic with the highest probability, inferred directly from topic-word distribution.</p>
        <p>In <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>, we present the evaluation of the obtained topics. Semantic coherence is a criterion developed by Mimno and colleagues [<xref ref-type="bibr" rid="ref37">37</xref>]; it is maximized when the most probable words in a given topic frequently cooccur together, and it has been shown that the semantic coherence metric correlates well with human judgment of topic quality [<xref ref-type="bibr" rid="ref37">37</xref>].</p>
        <p>Topics 19, 17, and 10 show all semantic coherence values to the right side of the plot, with topic 19 to the rightmost possible position and close to topic 10. Topics 1, 6, and 3 are in the central positions, while upper right side positions are six optimal selected topics showing acceptable values.</p>
        <p>We then assigned happiness scores to topics with the hedonometer tool (we proceeded as was done with VosViewer clusters described in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). As shown in <xref rid="figure6" ref-type="fig">Figure 6</xref>, STM allows us to label the topics as “More likely Women” and “More likely Men.”</p>
        <p>As presented in <xref ref-type="table" rid="table3">Table 3</xref>, each topic is defined as a list of 20 words. To assign happiness scores, we selected the words with the highest probability (first row of each topic in <xref ref-type="table" rid="table3">Table 3</xref>). Therefore, we applied the hedonometer tool to assign a happiness score to each word with the highest probability of each topic.</p>
        <p>In the <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>, we present the complete list of all words defining each topic. For each word, we present the happiness score and its corresponding topic (and therefore the associated gender to the topic). We selected a subset of these words (<xref ref-type="table" rid="table4">Tables 4</xref> and <xref ref-type="table" rid="table5">5</xref>). We show the 25 words with the highest happiness scores and those with the lowest happiness scores along with the corresponding gender.</p>
        <p><xref ref-type="table" rid="table4">Table 4</xref> shows that 19 of the 25 words with the highest happiness scores correspond to women’s topics and only 6 correspond to men’s topics. <xref ref-type="table" rid="table5">Table 5</xref> shows the 25 words with the lowest happiness scores, and only 7 corresponded to women, while 18 corresponded to men.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Top three identified topics and percentages for women (topics 1, 3, 6) and men (topics 10, 17, 19).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="100"/>
            <col width="300"/>
            <col width="300"/>
            <col width="300"/>
            <thead>
              <tr valign="bottom">
                <td>Topic (%)</td>
                <td>Highest probability</td>
                <td>FREX<sup>a</sup></td>
                <td>Score</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>1 (5.23)</td>
                <td>year, happy, tomorrow, open, birthday, take, come, busy, christmas, baby, sleep, friday, sunday, monday, list, bed, smile, market, treat, guess</td>
                <td>merri, birthday, appl, ang, eve, awak, con, clay, decemb, angel, happi, est, syracus, ako, relax, closet, lang, store, carousel</td>
                <td>happi, year, birthday, tomorrow, open, christma, sleep, friday, come, busi, babi, sunday, take, bed, store, monday, holiday, list, date, market</td>
              </tr>
              <tr valign="top">
                <td>3 (7.21)</td>
                <td>good, great, video, hope, night, morn, lol, tonight, long, done, head, weekend, fun, readi, celebrate, citi, movie, luck, earli, forget</td>
                <td>playlist, chicken, grill, peter, egg, chees, movi, delici, potato, cooki, bbq, soup, recip, video, kitti, cup, chili, luck, pan, belli</td>
                <td>good, video, hope, night, morn, great, lol, weekend, playlist, movi, tonight, don, luck, fun, long, sweet, forget, gonna, saturday, dinner</td>
              </tr>
              <tr valign="top">
                <td>6 (5.73)</td>
                <td>time, life, thing, world, god, famili, twitter, hear, power, hate, pass, speak, human, step, posit, bless, super, continu, messag, creat</td>
                <td>god, lord, pray, faith, amen, bless, prayer, psalm, soul, negat, holi, heal, thank, charl, nchousingbuild, merci, evil, accomplish, yea, compass</td>
                <td>time, god, thing, life, famili, twitter, world, lord, bless, hear, power, step, super, hate, pray, prayer, congrat, pop, faith, posit</td>
              </tr>
              <tr valign="top">
                <td>10 (3.82)</td>
                <td>end, heart, walk, news, stop, run, hand, pay, mile, rate, worth, success, dead, offer, singl, reach, staff, fail, snow, hero</td>
                <td>mile, rate, bpm, attitud, anthem, bioness, hawk, failur, shoulder, flaw, casual, complic, tattoo, zombi, hero, pinterest, hand, virus, vancouv</td>
                <td>heart, walk, end, news, mile, stop, run, rate, bpm, hand, pay, dead, success, attitud, hero, snow, worth, bbc, offer, reach</td>
              </tr>
              <tr valign="top">
                <td>17 (5.25)</td>
                <td>back, play, game, team, job, place, boy, man, point, won, lost, black, park, perfect, act, lose, john, footbal, film, player</td>
                <td>yard, hole, playoff, player, joe, nfl, eagl, cowboy, bronx, kiss, dalla, theater, doodl, lewi, cunt, throw, golden, barn, korea, brave</td>
                <td>game, team, play, back, boy, job, footbal, player, park, perfect, black, act, place, north, beat, test, film, lose, tour, kick</td>
              </tr>
              <tr valign="top">
                <td>19 (6.25)</td>
                <td>stroke, support, find, survivor, learn, lot, brain, care, health, patient, help, aware, money, raise, children, research, import, risk, experience, hospital</td>
                <td>aware, raise, foundat, risk, research, patient, region, medic, lot, recoveri, donat, increas, factor, studi, resourc, rehab, treatment, cancer, rehabilit, learn</td>
                <td>stroke, survivor, learn, lot, find, support, brain, patient, awar, care, rais, health, research, risk, foundat, injuri, studi, region, recoveri, disease</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>FREX: frequency-exclusivity.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Top 25 words with highest happiness scores, topics, and gender of participants.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="250"/>
            <col width="250"/>
            <col width="250"/>
            <col width="250"/>
            <thead>
              <tr valign="top">
                <td>Word</td>
                <td>Participant</td>
                <td>Score</td>
                <td>Topic</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Love</td>
                <td>Women</td>
                <td>8.42</td>
                <td>T16</td>
              </tr>
              <tr valign="top">
                <td>Happy</td>
                <td>Women</td>
                <td>8.3</td>
                <td>T1</td>
              </tr>
              <tr valign="top">
                <td>Win</td>
                <td>Women</td>
                <td>8.12</td>
                <td>T15</td>
              </tr>
              <tr valign="top">
                <td>Smile</td>
                <td>Women</td>
                <td>8.1</td>
                <td>T1</td>
              </tr>
              <tr valign="top">
                <td>Won</td>
                <td>Men</td>
                <td>8.1</td>
                <td>T17</td>
              </tr>
              <tr valign="top">
                <td>Music</td>
                <td>Women</td>
                <td>8.02</td>
                <td>T2</td>
              </tr>
              <tr valign="top">
                <td>Weekend</td>
                <td>Women</td>
                <td>8.0</td>
                <td>T3</td>
              </tr>
              <tr valign="top">
                <td>Celebrate</td>
                <td>Women</td>
                <td>7.98</td>
                <td>T3</td>
              </tr>
              <tr valign="top">
                <td>Christmas</td>
                <td>Women</td>
                <td>7.96</td>
                <td>T1</td>
              </tr>
              <tr valign="top">
                <td>Fun</td>
                <td>Women</td>
                <td>7.96</td>
                <td>T3</td>
              </tr>
              <tr valign="top">
                <td>Free</td>
                <td>Men</td>
                <td>7.96</td>
                <td>T11</td>
              </tr>
              <tr valign="top">
                <td>Great</td>
                <td>Women</td>
                <td>7.88</td>
                <td>T3</td>
              </tr>
              <tr valign="top">
                <td>Success</td>
                <td>Men</td>
                <td>7.86</td>
                <td>T10</td>
              </tr>
              <tr valign="top">
                <td>Award</td>
                <td>Women</td>
                <td>7.86</td>
                <td>T15</td>
              </tr>
              <tr valign="top">
                <td>Positive</td>
                <td>Women</td>
                <td>7.8</td>
                <td>T6</td>
              </tr>
              <tr valign="top">
                <td>Hero</td>
                <td>Men</td>
                <td>7.8</td>
                <td>T10</td>
              </tr>
              <tr valign="top">
                <td>Sun</td>
                <td>Men</td>
                <td>7.8</td>
                <td>T11</td>
              </tr>
              <tr valign="top">
                <td>Birthday</td>
                <td>Women</td>
                <td>7.78</td>
                <td>T1</td>
              </tr>
              <tr valign="top">
                <td>Winner</td>
                <td>Women</td>
                <td>7.78</td>
                <td>T15</td>
              </tr>
              <tr valign="top">
                <td>Beauty</td>
                <td>Men</td>
                <td>7.76</td>
                <td>T5</td>
              </tr>
              <tr valign="top">
                <td>Family</td>
                <td>Women</td>
                <td>7.72</td>
                <td>T6</td>
              </tr>
              <tr valign="top">
                <td>Gift</td>
                <td>Women</td>
                <td>7.72</td>
                <td>T15</td>
              </tr>
              <tr valign="top">
                <td>Brilliant</td>
                <td>Women</td>
                <td>7.68</td>
                <td>T2</td>
              </tr>
              <tr valign="top">
                <td>Super</td>
                <td>Women</td>
                <td>7.68</td>
                <td>T6</td>
              </tr>
              <tr valign="top">
                <td>Amazing</td>
                <td>Women</td>
                <td>7.66</td>
                <td>T16</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Top 25 words with the lowest happiness scores, topics, and gender of participants.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="250"/>
            <col width="250"/>
            <col width="250"/>
            <col width="250"/>
            <thead>
              <tr valign="top">
                <td>Word</td>
                <td>Participant</td>
                <td>Score</td>
                <td>Topic</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Death</td>
                <td>Men</td>
                <td>1.54</td>
                <td>T18</td>
              </tr>
              <tr valign="top">
                <td>Kill</td>
                <td>Women</td>
                <td>1.56</td>
                <td>T12</td>
              </tr>
              <tr valign="top">
                <td>Die</td>
                <td>Men</td>
                <td>1.74</td>
                <td>T18</td>
              </tr>
              <tr valign="top">
                <td>Fail</td>
                <td>Men</td>
                <td>1.96</td>
                <td>T10</td>
              </tr>
              <tr valign="top">
                <td>Dead</td>
                <td>Men</td>
                <td>2.0</td>
                <td>T10</td>
              </tr>
              <tr valign="top">
                <td>Pain</td>
                <td>Men</td>
                <td>2.1</td>
                <td>T4</td>
              </tr>
              <tr valign="top">
                <td>Hell</td>
                <td>Men</td>
                <td>2.22</td>
                <td>T9</td>
              </tr>
              <tr valign="top">
                <td>Poor</td>
                <td>Men</td>
                <td>2.32</td>
                <td>T9</td>
              </tr>
              <tr valign="top">
                <td>Hate</td>
                <td>Women</td>
                <td>2.34</td>
                <td>T6</td>
              </tr>
              <tr valign="top">
                <td>Sad</td>
                <td>Women</td>
                <td>2.38</td>
                <td>T12</td>
              </tr>
              <tr valign="top">
                <td>Attack</td>
                <td>Men</td>
                <td>2.42</td>
                <td>T8</td>
              </tr>
              <tr valign="top">
                <td>Shot</td>
                <td>Women</td>
                <td>2.5</td>
                <td>T2</td>
              </tr>
              <tr valign="top">
                <td>Shit</td>
                <td>Men</td>
                <td>2.5</td>
                <td>T18</td>
              </tr>
              <tr valign="top">
                <td>Aphasia</td>
                <td>Men</td>
                <td>2.58</td>
                <td>T11</td>
              </tr>
              <tr valign="top">
                <td>Stroke</td>
                <td>Men</td>
                <td>2.58</td>
                <td>T19</td>
              </tr>
              <tr valign="top">
                <td>Lie</td>
                <td>Men</td>
                <td>2.6</td>
                <td>T13</td>
              </tr>
              <tr valign="top">
                <td>Bad</td>
                <td>Women</td>
                <td>2.64</td>
                <td>T16</td>
              </tr>
              <tr valign="top">
                <td>Fight</td>
                <td>Women</td>
                <td>2.7</td>
                <td>T16</td>
              </tr>
              <tr valign="top">
                <td>Lost</td>
                <td>Men</td>
                <td>2.76</td>
                <td>T17</td>
              </tr>
              <tr valign="top">
                <td>Lose</td>
                <td>Men</td>
                <td>2.76</td>
                <td>T17</td>
              </tr>
              <tr valign="top">
                <td>Disabled</td>
                <td>Men</td>
                <td>2.82</td>
                <td>T18</td>
              </tr>
              <tr valign="top">
                <td>Problem</td>
                <td>Men</td>
                <td>2.98</td>
                <td>T4</td>
              </tr>
              <tr valign="top">
                <td>Wrong</td>
                <td>Men</td>
                <td>3.14</td>
                <td>T18</td>
              </tr>
              <tr valign="top">
                <td>Forget</td>
                <td>Women</td>
                <td>3.22</td>
                <td>T3</td>
              </tr>
              <tr valign="top">
                <td>Cut</td>
                <td>Men</td>
                <td>3.42</td>
                <td>T9</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <p>We then calculated the boxplots of the happiness scores for each topic (<xref ref-type="fig" rid="figure7">Figure 7</xref>), ordered from “More Likely Men” to “More Likely Women”; the means and regression line are shown in red circles and a red line, respectively (<italic>P</italic>&lt;.001).</p>
        <p><xref ref-type="fig" rid="figure7">Figure 7</xref> shows higher happiness scores from Topic 4 to the right (ie, women’s topics) with the exception of Topic 16, which contains several words with low happiness scores (eg, “bad” or “lone”; <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). The regression line shows a positive slope in the direction of women’s topics (<italic>P</italic>&lt;.001).</p>
        <p>We then compared happiness scores by pairs from the leftmost and rightmost topics in <xref rid="figure6" ref-type="fig">Figure 6</xref> to the center (Topic 19-Topic 1, Topic 17-Topic 6, Topic 10-Topic 3, etc). We found significant differences in favor of women in 4 of the 10 pairs of topics (and none in favor of men) when comparing the happiness scores by pairs of topics (<xref ref-type="fig" rid="figure8">Figure 8</xref>; men blue, women red). The complete list of comparisons is presented in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p>
        <p>STM also permits the estimation of correlations between topics. A positive correlation indicates that both topics are likely to be discussed in the same tweet. In <xref ref-type="fig" rid="figure9">Figure 9</xref>, we plot both positive and negative correlations for all identified topics.</p>
        <p>Topic 1 shows the highest positive correlation with Topic 3. This can be further confirmed in <xref ref-type="table" rid="table3">Table 3</xref>, as both topics address positive everyday life situations such as celebrations (birthday, Christmas, holiday, merry). Topic 1 is strongly negatively correlated with Topic 19, which refers to research, studies, risks, factors, hospital, disease, stroke, and care.</p>
        <p>Topic 3, therefore, is also strongly negatively correlated with Topic 19 and Topic 10.</p>
        <p>Topic 10 refers to running, beats per minute, heart rate, attitude, stop, walk, and reach, while Topic 3 refers to fun, celebrate, movie, Saturday, dinner, barbecue, chicken, grill, egg, cheese, delicious, potato, and cooking. Topic 6 addresses religion—god, lord, pray, faith, amen, bless, prayer, psalm, soul—while Topic 17 addresses sports—playoff, nfl, game, yard, football, player—showing clear differences in topics of interest addressed by men and women.</p>
        <fig id="figure7" position="float">
          <caption>
            <p>Boxplots of happiness scores for each topic, ordered from “More Likely Men” to “More Likely Women.” Means are shown as red circles and the regression line as a red line.</p>
          </caption>
          <graphic xlink:href="jmir_v21i8e14077_fig7.png" alt-version="no" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure8" position="float">
          <caption>
            <p>Comparison of happiness scores by pairs of topics (men: blue; women: red).</p>
          </caption>
          <graphic xlink:href="jmir_v21i8e14077_fig8.png" alt-version="no" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure9" position="float">
          <caption>
            <p>Positive and negative correlations between the topics identified with structural topic modeling.</p>
          </caption>
          <graphic xlink:href="jmir_v21i8e14077_fig9.png" alt-version="no" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>In this work, we proposed the application of Twitter lists to a chronic health condition in a GNU framework (R-3.5.1). We applied a set of publicly available R libraries for collecting and organizing Twitter data via Twitter’s REST and stream API (<italic>rtweet</italic>), sentiment analysis (<italic>syuzhet</italic>), text mining (<italic>tm, quanteda</italic>), and structural topic modeling (<italic>stm</italic>). We also applied the hedonometer tool to assign happiness scores to topics by gender.</p>
        <p>According to our findings, men use significantly more words while expressing negative emotions in their tweets than women, while women use significantly more words when expressing positive emotions.</p>
        <p>The results also show that the top three most frequent emotions evoked by both men and women are trust, anticipation, and joy. In addition, the statistical analysis of the basic emotions detects significant preferences for each gender: While words from the emotional fields of trust, anticipation, and joy appear significantly more often in women’s tweets, men’s tweets exhibit a significant preference for evoking disgust, anger, fear, and sadness.</p>
        <p>We also applied another tool that was specifically designed for considering Twitter inputs—the hedonometer. Happiness ratings obtained by the hedonometer, summarized on a daily basis for each user, are also higher for women than for men almost all along the considered time period.</p>
        <p>Finally, we applied structural topic modeling (to the best of our knowledge, for the first time to a chronic health condition) to identify main topics addressed by gender and determined positive and negative correlations between topics by gender.</p>
        <p>Topics in this context are defined as sets of words; therefore, we assigned happiness scores to the words with highest probabilities in the identified topics and found that the topics women talk about show higher happiness scores than the topics addressed by men.</p>
        <p>A common stereotype in both Western and Eastern cultures suggests that women are more emotional than men, particularly when responding to negative emotions [<xref ref-type="bibr" rid="ref38">38</xref>]. As remarked in the Introduction section, after stroke, women experience more activity limitations, worse health-related quality of life, and more poststroke depression than men [<xref ref-type="bibr" rid="ref7">7</xref>] and are twice as likely as men to suffer from severe depression following a stroke. We identify several explanations for our findings, listed below.</p>
        <p>First, according to Ayis et al [<xref ref-type="bibr" rid="ref8">8</xref>], women draw larger components of their sense of self and self-worth from interpersonal relationships and networks, and they are more sensitive to adversities of these. Therefore, female stroke survivors may experience (to a larger extent in comparison to men) the interpersonal and intrapersonal benefits of sharing positive events and emotions on social network sites (SNSs). The intrapersonal benefits of sharing positive events and emotions on SNSs consist of re-experiencing and prolonging these positive events; the interpersonal benefits comprise positive social interaction and positive feedback from other SNS users (according to the results of an ethnographic diary study on Facebook use from Sas et al [<xref ref-type="bibr" rid="ref39">39</xref>]).</p>
        <p>Second, prior research indicates that the positivity of self-presentation on SNSs has an influence on both the quantity and quality of reactions from other SNS contacts. For example, Utz [<xref ref-type="bibr" rid="ref40">40</xref>] found that SNS users were least likely to receive reactions from their online friends when they expressed sadness in their postings. Similarly, Forest and Wood [<xref ref-type="bibr" rid="ref41">41</xref>] demonstrated that more positive status updates on Facebook received more positive and favorable feedback from friends than negative status updates.</p>
        <p>A third explanation for our findings can be related to the existence of “the positivity bias in SNS communication,” which states that “while the SNS environment generally enables authentic self-presentation, it favors positive forms of authenticity over the presentation of negative aspects of the true self” [<xref ref-type="bibr" rid="ref42">42</xref>].</p>
        <p>Therefore, according to Reinecke et al, due to the positivity bias in SNS communication, individuals with higher levels of psychological well-being have a higher chance of experiencing authenticity through the use of SNSs than SNS users with low psychological well-being.</p>
        <p>The fourth explanation is related to a recent Facebook analysis involving 15,000 users [<xref ref-type="bibr" rid="ref43">43</xref>]. The authors concluded that “language used more by self-identified females was interpersonally warmer, more compassionate, polite, and—contrary to previous findings—slightly more assertive in their language use, whereas language used more by self-identified males was colder, more hostile, and impersonal.” In fact, the following text from their publication can also be applied to our own findings:</p>
        <disp-quote><p>The most strongly female-linked topics included words describing positive emotions (e.g., “excited”, “happy”, “&lt;3”, “love”,), social relationships (e.g., “friends”, “family”, “sister”), and intensive adverbs (e.g., “sooo”, “sooooo”, “ridiculously”). Strongly male-linked topics included words related to politics (e.g., “government”, “tax”, “political”), sports and competition (e.g.,“football”, “season”, “win”, “battle”), and specific interests or activities, such as shooting guns, playing musical instruments, or playing video games.</p></disp-quote>
        <p>Therefore, according to this fourth explanation, our findings in another SNS such as Twitter are similar to those involving users not necessarily identified as stroke survivors on Facebook.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>The collected sample was not intended to be representative or a comprehensive set of all tweets posted by stroke survivors during the period under study. Although the collected data also included tweets directed at other users (ie, conversational tweets), the results cannot be considered to reflect all topics of conversation appearing in Twitter for stroke survivors.</p>
        <p>Data collection relied on Twitter’s streaming API, which prevents collection of tweets from private Twitter accounts. As a result, findings may not represent individuals with private accounts.</p>
        <p>Furthermore, a recent analysis [<xref ref-type="bibr" rid="ref44">44</xref>] shows that 62% of all Twitter users are less than 49 years old; our participants are skewed toward this age range, and most of them are from the United States.</p>
        <p>Nevertheless, as discussed in the Introduction section, multiple recent studies have reported a sustained increase in the incidence of stroke at younger ages. Moreover, the included participants were randomly selected after checking their membership in several Twitter stroke–related lists, and their gender and stroke survivor status were manually double-checked.</p>
        <p>We analyzed women (n=244) who posted a total of 3,788,069 tweets. From them, we included 396,898 tweets in our analysis (the most recent ones, up to December 2018); therefore, we analyzed 10.5% of all posted tweets by women participating in this study.</p>
        <p>We analyzed men (n=235) who posted a total of 1,469,364 tweets. From them, we included 403,526 tweets in our analysis (the most recent ones, up to December 2018). Therefore, we analyzed 27.4% of all posted tweets by men participating in this study.</p>
        <p>The total number of tweets posted by the women from whom we extracted our sample is clearly larger than the number posted by the men. This seems to be consistent with general Twitter use statistics: Women are usually more active, and each month, 40 million more women than men visit Twitter [<xref ref-type="bibr" rid="ref45">45</xref>].</p>
        <p>Other relevant factors to be mentioned as limitations to our study are related to geographic location, spatial trajectory, or the time of the day a tweet has been posted. As remarked by Padilla et al [<xref ref-type="bibr" rid="ref46">46</xref>] and Gore et al [<xref ref-type="bibr" rid="ref47">47</xref>], such factors may affect tweets’ sentiments. We observed that 85% of our participants’ profiles are from the United Kingdom and United States, but spatiotemporal aspects are not controlled in our study.</p>
        <p>Finally, the individual psychological differences that stroke survivors may experience must also be mentioned. Certain individuals might have personality traits that make them more predisposed to positive or negative sentiments. The degree to which sentiment reflects variance in psychological traits versus the situational context in which those traits were expressed is unclear. Potential users affected by severe depression may not be active on Twitter; this could be another source of significant bias in the data sample.</p>
      </sec>
      <sec>
        <title>Comparison with Prior Work</title>
        <p>One of the few previous studies on tweet topics or sentiment analysis in chronic health conditions was recently conducted by Brunner and colleagues [<xref ref-type="bibr" rid="ref48">48</xref>]. Tweets tagged with traumatic brain injury (TBI)-related hashtags were harvested over a one-month period in 2016 and analyzed qualitatively and quantitatively. A total of 29,199 tweets included tweets sent by 893 users, 219 of whom had a brain injury. Twitter was used to discuss health issues, raise awareness of TBI, talk about life after TBI, talk about sport and concussion, and communicate inspirational messages.</p>
        <p>In relation to depression, Lachmar and colleagues [<xref ref-type="bibr" rid="ref49">49</xref>] captured 3225 original tweets for the hashtag #MyDepressionLooksLike that circulated in May 2016. Cleaning resulted in a total of 1978 tweets. Qualitative content analysis revealed seven themes: dysfunctional thoughts, lifestyle challenges, social struggles, hiding behind a mask, apathy and sadness, suicidal thoughts and behaviors, and seeking relief. Contrary to Lachmar and colleagues’ [<xref ref-type="bibr" rid="ref49">49</xref>] analysis or the #Stroke analysis (the one presented in the Introduction section), our analysis is not linked to a specific hashtag.</p>
        <p>It is important to note the need for further research from a gender perspective, as promoted by initiatives such as the Women’s Brain Project [<xref ref-type="bibr" rid="ref50">50</xref>].</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>This study explored emotional expressivity for eight specific types of emotion and identified 20 main topics of interest through Twitter posts in stroke survivors from a gender perspective. Numerous studies have shown that, compared with men, women usually experience more frequent and stronger negative emotions. Nevertheless, our results show that men present more frequent and stronger negative emotions in their tweets, when considering both globally positive-negative or individual tweets and analyzing them using two different well-established approaches: the Plutchik model and the hedonometer tool.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Demographics, wordclouds, VosViewer cluster analysis, latent Dirichlet allocation topics, correlation analysis, STM topics, hedonometer scores, and the Plutchik psychoevolutionary model.</p>
        <media xlink:href="jmir_v21i8e14077_app1.pdf" xlink:title="PDF File (Adobe PDF File), 2 MB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">API</term>
          <def>
            <p>application program interface</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">EM</term>
          <def>
            <p>expectation maximization</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">FREX</term>
          <def>
            <p>frequency-exclusivity</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">HRQoL</term>
          <def>
            <p>health-related quality of life</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">LDA</term>
          <def>
            <p>latent Dirichlet allocation</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">NRC</term>
          <def>
            <p>National Research Council</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">REST</term>
          <def>
            <p>representational state transfer</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">SNS</term>
          <def>
            <p>social network site</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">STM</term>
          <def>
            <p>structural topic modeling</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">TDM</term>
          <def>
            <p>term document matrix</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">TF-IDF</term>
          <def>
            <p>term frequency – inverse document frequency</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This research was partially funded by EU H2020 PRECISE4Q - Personalized Medicine by Predictive Modeling in Stroke for better Quality of Life (Grant Agreement 777107 – Research and Innovation Action).</p>
    </ack>
    <fn-group>
      <fn fn-type="con">
        <p>AG-R and SL conceived the study. AG-R, JS, and SL collected, selected, and cleaned the data. AG-R and JS analyzed the data. AG-R drafted the initial manuscript. SL, JS, and MBG revised the manuscript critically for important intellectual content and approved the final manuscript. AG-R, SL, JS, and MBG received funding for the study.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Onuma</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Owolabi</surname>
              <given-names>MS</given-names>
            </name>
          </person-group>
          <source>Bulletin of the World Health Organization</source>
          <year>2016</year>
          <access-date>2019-07-22</access-date>
          <comment>Stroke: a global response is needed <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.who.int/bulletin/volumes/94/9/16-181636.pdf">https://www.who.int/bulletin/volumes/94/9/16-181636.pdf</ext-link></comment>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Béjot</surname>
              <given-names>Yannick</given-names>
            </name>
            <name name-style="western">
              <surname>Daubail</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Jacquin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Durier</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Osseby</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Rouaud</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Giroud</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Trends in the incidence of ischaemic stroke in young adults between 1985 and 2011: the Dijon Stroke Registry</article-title>
          <source>J Neurol Neurosurg Psychiatry</source>
          <year>2014</year>
          <month>05</month>
          <volume>85</volume>
          <issue>5</issue>
          <fpage>509</fpage>
          <lpage>13</lpage>
          <pub-id pub-id-type="doi">10.1136/jnnp-2013-306203</pub-id>
          <pub-id pub-id-type="medline">24249786</pub-id>
          <pub-id pub-id-type="pii">jnnp-2013-306203</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Putaala</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Ischemic stroke in the young: Current perspectives on incidence, risk factors, and cardiovascular prognosis</article-title>
          <source>Eur Stroke J</source>
          <year>2016</year>
          <month>03</month>
          <day>08</day>
          <volume>1</volume>
          <issue>1</issue>
          <fpage>28</fpage>
          <lpage>40</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31008265"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/2396987316629860</pub-id>
          <pub-id pub-id-type="medline">31008265</pub-id>
          <pub-id pub-id-type="pii">10.1177_2396987316629860</pub-id>
          <pub-id pub-id-type="pmcid">PMC6301217</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vangen-Lønne</surname>
              <given-names>Anne Merete</given-names>
            </name>
            <name name-style="western">
              <surname>Wilsgaard</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Johnsen</surname>
              <given-names>SH</given-names>
            </name>
            <name name-style="western">
              <surname>Carlsson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Mathiesen</surname>
              <given-names>EB</given-names>
            </name>
          </person-group>
          <article-title>Time trends in incidence and case fatality of ischemic stroke: the Tromsø Study 1977-2010</article-title>
          <source>Stroke</source>
          <year>2015</year>
          <month>05</month>
          <day>07</day>
          <volume>46</volume>
          <issue>5</issue>
          <fpage>1173</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1161/STROKEAHA.114.008387</pub-id>
          <pub-id pub-id-type="medline">25851772</pub-id>
          <pub-id pub-id-type="pii">STROKEAHA.114.008387</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Krishnamurthi</surname>
              <given-names>RV</given-names>
            </name>
            <name name-style="western">
              <surname>Moran</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Feigin</surname>
              <given-names>VL</given-names>
            </name>
            <name name-style="western">
              <surname>Barker-Collo</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Norrving</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Mensah</surname>
              <given-names>GA</given-names>
            </name>
            <name name-style="western">
              <surname>Taylor</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Naghavi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Forouzanfar</surname>
              <given-names>MH</given-names>
            </name>
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>CO</given-names>
            </name>
            <name name-style="western">
              <surname>Vos</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Murray</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Roth</surname>
              <given-names>GA</given-names>
            </name>
          </person-group>
          <article-title>Stroke Prevalence, Mortality and Disability-Adjusted Life Years in Adults Aged 20-64 Years in 1990-2013: Data from the Global Burden of Disease 2013 Study</article-title>
          <source>Neuroepidemiology</source>
          <year>2015</year>
          <month>10</month>
          <day>28</day>
          <volume>45</volume>
          <issue>3</issue>
          <fpage>190</fpage>
          <lpage>202</lpage>
          <pub-id pub-id-type="doi">10.1159/000441098</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Putaala</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kurkinen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tarvos</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Salonen</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Kaste</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tatlisumak</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Silent brain infarcts and leukoaraiosis in young adults with first-ever ischemic stroke</article-title>
          <source>Neurology</source>
          <year>2009</year>
          <month>05</month>
          <day>26</day>
          <volume>72</volume>
          <issue>21</issue>
          <fpage>1823</fpage>
          <lpage>1829</lpage>
          <pub-id pub-id-type="doi">10.1212/WNL.0b013e3181a711df</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gall</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Phan</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Madsen</surname>
              <given-names>TE</given-names>
            </name>
            <name name-style="western">
              <surname>Reeves</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Rist</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Jimenez</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lichtman</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dong</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Lisabeth</surname>
              <given-names>LD</given-names>
            </name>
          </person-group>
          <article-title>Focused Update of Sex Differences in Patient Reported Outcome Measures After Stroke</article-title>
          <source>Stroke</source>
          <year>2018</year>
          <month>03</month>
          <volume>49</volume>
          <issue>3</issue>
          <fpage>531</fpage>
          <lpage>535</lpage>
          <pub-id pub-id-type="doi">10.1161/STROKEAHA.117.018417</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ayis</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Rudd</surname>
              <given-names>AG</given-names>
            </name>
            <name name-style="western">
              <surname>Ayerbe</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Wolfe</surname>
              <given-names>CDA</given-names>
            </name>
          </person-group>
          <source>Sex differences in trajectories of depression symptoms and associations with 10-year mortality in stroke patients: The South London Stroke Register</source>
          <year>2019</year>
          <publisher-loc>London</publisher-loc>
          <publisher-name>The South London Stroke Register</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mathers</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>The global burden of disease update</article-title>
          <source>The Global Burden of Disease: 2004 Update</source>
          <year>2008</year>
          <publisher-loc>Geneva</publisher-loc>
          <publisher-name>World Health Organization</publisher-name>
          <fpage>2004</fpage>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Radu</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Solomon</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gheorghe</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Hostiuc</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bulescu</surname>
              <given-names>IA</given-names>
            </name>
            <name name-style="western">
              <surname>Purcarea</surname>
              <given-names>VL</given-names>
            </name>
          </person-group>
          <article-title>The adaptation of health care marketing to the digital era</article-title>
          <source>J Med Life</source>
          <year>2017</year>
          <volume>10</volume>
          <issue>1</issue>
          <fpage>44</fpage>
          <lpage>46</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/28255375"/>
          </comment>
          <pub-id pub-id-type="medline">28255375</pub-id>
          <pub-id pub-id-type="pmcid">PMC5304370</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cabrera-Maqueda</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Minhas</surname>
              <given-names>JS</given-names>
            </name>
          </person-group>
          <article-title>New Horizons for Stroke Medicine: Understanding the Value of Social Media</article-title>
          <source>Stroke</source>
          <year>2018</year>
          <month>02</month>
          <volume>49</volume>
          <issue>2</issue>
          <fpage>25</fpage>
          <lpage>27</lpage>
          <pub-id pub-id-type="doi">10.1161/STROKEAHA.117.020068</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bundy</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Chick</surname>
              <given-names>JFB</given-names>
            </name>
            <name name-style="western">
              <surname>Hage</surname>
              <given-names>AN</given-names>
            </name>
            <name name-style="western">
              <surname>Srinivasa</surname>
              <given-names>RN</given-names>
            </name>
            <name name-style="western">
              <surname>Chaudhary</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Srinivasa</surname>
              <given-names>RN</given-names>
            </name>
            <name name-style="western">
              <surname>Vadlamudi</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Gemmete</surname>
              <given-names>JJ</given-names>
            </name>
          </person-group>
          <article-title>#Stroke</article-title>
          <source>J NeuroIntervent Surg</source>
          <year>2018</year>
          <month>04</month>
          <day>20</day>
          <volume>10</volume>
          <issue>12</issue>
          <fpage>e33</fpage>
          <lpage>e33</lpage>
          <pub-id pub-id-type="doi">10.1136/neurintsurg-2018-013877</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Brennan</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Adjustment to cancer - coping or personal transition?</article-title>
          <source>Psychooncology</source>
          <year>2001</year>
          <volume>10</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>18</lpage>
          <pub-id pub-id-type="medline">11180573</pub-id>
          <pub-id pub-id-type="pii">10.1002/1099-1611(200101/02)10:1&lt;1::AID-PON484&gt;3.0.CO;2-T</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Taylor</surname>
              <given-names>GH</given-names>
            </name>
            <name name-style="western">
              <surname>Todman</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Broomfield</surname>
              <given-names>NM</given-names>
            </name>
          </person-group>
          <article-title>Post-stroke emotional adjustment: A modified social cognitive transition model</article-title>
          <source>Neuropsychological Rehabilitation</source>
          <year>2011</year>
          <month>12</month>
          <volume>21</volume>
          <issue>6</issue>
          <fpage>808</fpage>
          <lpage>824</lpage>
          <pub-id pub-id-type="doi">10.1080/09602011.2011.598403</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sylwester</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Purver</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Twitter Language Use Reflects Psychological Differences between Democrats and Republicans</article-title>
          <source>PLoS One</source>
          <year>2015</year>
          <month>09</month>
          <volume>10</volume>
          <issue>9</issue>
          <fpage>e0137422</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0137422"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0137422</pub-id>
          <pub-id pub-id-type="medline">26375581</pub-id>
          <pub-id pub-id-type="pii">PONE-D-15-11526</pub-id>
          <pub-id pub-id-type="pmcid">PMC4574198</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kramer</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>The spread of emotion via Facebook</article-title>
          <source>Proceedings of the SIGCHI Conference on Human Factors in Computing Systems</source>
          <year>2012</year>
          <conf-name>SIGCHI Conference on Human Factors in Computing Systems</conf-name>
          <conf-date>May 5-10, 2012</conf-date>
          <conf-loc>Austin, Texas</conf-loc>
          <publisher-loc>USA</publisher-loc>
          <publisher-name>ACM</publisher-name>
          <fpage>767</fpage>
          <lpage>770</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kern</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Eichstaedt</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Schwartz</surname>
              <given-names>HA</given-names>
            </name>
            <name name-style="western">
              <surname>Sap</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>LK</given-names>
            </name>
            <name name-style="western">
              <surname>Ungar</surname>
              <given-names>LH</given-names>
            </name>
          </person-group>
          <article-title>Gaining Insights From Social Media Language: Methodologies and Challenges</article-title>
          <source>Psychol Methods</source>
          <year>2016</year>
          <month>08</month>
          <day>08</day>
          <fpage>507</fpage>
          <lpage>525</lpage>
          <pub-id pub-id-type="doi">10.1037/met0000091</pub-id>
          <pub-id pub-id-type="medline">27505683</pub-id>
          <pub-id pub-id-type="pii">2016-38181-001</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gohil</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Vuik</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Darzi</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Sentiment Analysis of Health Care Tweets: Review of the Methods Used</article-title>
          <source>JMIR Public Health Surveill</source>
          <year>2018</year>
          <month>04</month>
          <day>23</day>
          <volume>4</volume>
          <issue>2</issue>
          <fpage>e43</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://publichealth.jmir.org/2018/2/e43/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/publichealth.5789</pub-id>
          <pub-id pub-id-type="medline">29685871</pub-id>
          <pub-id pub-id-type="pii">v4i2e43</pub-id>
          <pub-id pub-id-type="pmcid">PMC5938573</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ardon</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Spatio-Temporal Analysis of Topic Popularity in Twitter</article-title>
          <source>arXiv</source>
          <year>2011</year>
          <month>04</month>
          <day>05</day>
          <fpage>2904</fpage>
          <lpage>2908</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ghosh</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zafar</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bhattacharya</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Sharma</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Ganguly</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <source>On sampling the wisdom of crowds: random vs. expert sampling of the twitter stream</source>
          <year>2013</year>
          <access-date>2019-08-06</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://ama.liglab.fr/wikiDeAMA/DOCS/randomvsexpert.pdf">http://ama.liglab.fr/wikiDeAMA/DOCS/randomvsexpert.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hoffmann</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>“Too many Americans are trapped in fear, violence and poverty”: a psychology-informed sentiment analysis of campaign speeches from the 2016 US Presidential Election</article-title>
          <source>Linguistics Vanguard</source>
          <year>2018</year>
          <volume>4</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1515/lingvan-2017-0008</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Plutchik</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>The Nature of Emotions: Human emotions have deep evolutionary roots, a fact that may explain their complexity and provide tools for clinical practice</article-title>
          <source>American Scientist</source>
          <year>2001</year>
          <fpage>344</fpage>
          <lpage>350</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mohammad</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Turney</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Emotions evoked by common words and phrases: Using Mechanical Turk to create an emotion lexicon</article-title>
          <year>2010</year>
          <conf-name>NAACL-HLT Workshop on computational approaches to analysis and generation of emotion in text</conf-name>
          <conf-date>2010</conf-date>
          <conf-loc>California, US</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schweinberger</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>A sociolinguistic analysis of emotives in Irish English</article-title>
          <year>2016</year>
          <conf-name>Annual Meeting of the Society for Text &amp; Discourse</conf-name>
          <conf-date>2016</conf-date>
          <conf-loc>Kassel</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dodds</surname>
              <given-names>PS</given-names>
            </name>
            <name name-style="western">
              <surname>Harris</surname>
              <given-names>KD</given-names>
            </name>
            <name name-style="western">
              <surname>Kloumann</surname>
              <given-names>IM</given-names>
            </name>
            <name name-style="western">
              <surname>Bliss</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Danforth</surname>
              <given-names>CM</given-names>
            </name>
          </person-group>
          <article-title>Temporal patterns of happiness and information in a global social network: hedonometrics and Twitter</article-title>
          <source>PLoS One</source>
          <year>2011</year>
          <month>12</month>
          <volume>6</volume>
          <issue>12</issue>
          <fpage>e26752</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0026752"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0026752</pub-id>
          <pub-id pub-id-type="medline">22163266</pub-id>
          <pub-id pub-id-type="pii">PONE-D-11-01360</pub-id>
          <pub-id pub-id-type="pmcid">PMC3233600</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Reece</surname>
              <given-names>AG</given-names>
            </name>
            <name name-style="western">
              <surname>Danforth</surname>
              <given-names>CM</given-names>
            </name>
          </person-group>
          <article-title>Instagram photos reveal predictive markers of depression</article-title>
          <source>EPJ Data Sci</source>
          <year>2017</year>
          <month>8</month>
          <day>8</day>
          <volume>6</volume>
          <issue>1</issue>
          <fpage>15</fpage>
          <pub-id pub-id-type="doi">10.1140/epjds/s13688-017-0110-z</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cody</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Reagan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mitchell</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Dodds</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Danforth</surname>
              <given-names>Christopher M</given-names>
            </name>
          </person-group>
          <article-title>Climate Change Sentiment on Twitter: An Unsolicited Public Opinion Poll</article-title>
          <source>PLoS One</source>
          <year>2015</year>
          <volume>10</volume>
          <issue>8</issue>
          <fpage>e0136092</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0136092"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0136092</pub-id>
          <pub-id pub-id-type="medline">26291877</pub-id>
          <pub-id pub-id-type="pii">PONE-D-15-20850</pub-id>
          <pub-id pub-id-type="pmcid">PMC4546368</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kearney</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <source>Package ‘rtweet’</source>
          <access-date>2019-03-19</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cran.r-project.org/web/packages/rtweet/rtweet.pdf">https://cran.r-project.org/web/packages/rtweet/rtweet.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Webb</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Jirotka</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Stahl</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Housley</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Edwards</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Procter</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Rana</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Burnap</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>The ethical challenges of publishing Twitter data for research dissemination</article-title>
          <year>2017</year>
          <conf-name>ACM on Web Science Conference</conf-name>
          <conf-date>2017</conf-date>
          <conf-loc>Troy, NY</conf-loc>
          <fpage>25</fpage>
          <lpage>28</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jockers</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <source>Introduction to the Syuzhet package</source>
          <access-date>2019-08-06</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cran.r-project.org/web/packages/syuzhet/vignettes/syuzhet-vignette.html">https://cran.r-project.org/web/packages/syuzhet/vignettes/syuzhet-vignette.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gries</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <source>Statistics for linguistics with R: A practical introduction</source>
          <year>2009</year>
          <publisher-loc>NY</publisher-loc>
          <publisher-name>Mouton de Gruyter</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Feinerer</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <source>Introduction to the tm Package: Text Mining in R</source>
          <access-date>2019-03-19</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cran.r-project.org/web/packages/tm/vignettes/tm.pdf">https://cran.r-project.org/web/packages/tm/vignettes/tm.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Murzintcev</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <source>ldatuning: Tuning of the Latent Dirichlet Allocation Models Parameters</source>
          <access-date>2019-03-19</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cran.r-project.org/web/packages/ldatuning/index.html">https://cran.r-project.org/web/packages/ldatuning/index.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <source>Journal of Statistical Software</source>
          <access-date>2019-03-19</access-date>
          <comment>stm: R Package for Structural Topic Models 
          <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cran.r-project.org/web/packages/stm/vignettes/stmVignette.pdf">https://cran.r-project.org/web/packages/stm/vignettes/stmVignette.pdf</ext-link></comment>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Blei</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Lafferty</surname>
              <given-names>JD</given-names>
            </name>
          </person-group>
          <article-title>A correlated topic model of Science</article-title>
          <source>Ann Appl Stat</source>
          <year>2007</year>
          <month>06</month>
          <volume>1</volume>
          <issue>1</issue>
          <fpage>17</fpage>
          <lpage>35</lpage>
          <pub-id pub-id-type="doi">10.1214/07-AOAS114</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Waltman</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>van Eck</surname>
              <given-names>NJ</given-names>
            </name>
            <name name-style="western">
              <surname>Noyons</surname>
              <given-names>EC</given-names>
            </name>
          </person-group>
          <article-title>A unified approach to mapping and clustering of bibliometric networks</article-title>
          <source>Journal of Informetrics</source>
          <year>2010</year>
          <month>10</month>
          <volume>4</volume>
          <issue>4</issue>
          <fpage>629</fpage>
          <lpage>635</lpage>
          <pub-id pub-id-type="doi">10.1016/j.joi.2010.07.002</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mimno</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Wallach</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Talley</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Leenders</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>McCallum</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Optimizing semantic coherence in topic models</article-title>
          <source>In Proceedings of the Conference on Empirical Methods in Natural Language Processing, EMNLP ’11, pp. 262–272. Association for Computational Linguistics, Stroudsburg, PA, USA</source>
          <year>2011</year>
          <conf-name>Conference on Empirical Methods in Natural Language Processing</conf-name>
          <conf-date>2011</conf-date>
          <conf-loc>Stroudsburg, PA, US</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Deng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Huo</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Gender Differences in Emotional Response: Inconsistency between Experience and Expressivity</article-title>
          <source>PLoS ONE</source>
          <year>2016</year>
          <month>6</month>
          <day>30</day>
          <volume>11</volume>
          <issue>6</issue>
          <fpage>e0158666</fpage>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0158666</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sas</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Dix</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hart</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Su</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Dramaturgical capitalization of positive emotions: The answer for Facebook success?</article-title>
          <year>2009</year>
          <conf-name>23rd British HCI group annual conference on people and computers: Celebrating people and technology</conf-name>
          <conf-date>2009</conf-date>
          <conf-loc>Swinton, UK</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Utz</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Social network site use among Dutch students: Effects of time and platform</article-title>
          <source>Networked Sociability and Individualism: Technology for Personal and Professional Relationships</source>
          <year>2011</year>
          <publisher-loc>Hershey, PA</publisher-loc>
          <publisher-name>IGI Global</publisher-name>
          <fpage>103</fpage>
          <lpage>125</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Forest</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Wood</surname>
              <given-names>JV</given-names>
            </name>
          </person-group>
          <article-title>When Social Networking Is Not Working</article-title>
          <source>Psychol Sci</source>
          <year>2012</year>
          <month>02</month>
          <day>07</day>
          <volume>23</volume>
          <issue>3</issue>
          <fpage>295</fpage>
          <lpage>302</lpage>
          <pub-id pub-id-type="doi">10.1177/0956797611429709</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Reinecke</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Trepte</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Authenticity and well-being on social network sites: A two-wave longitudinal study on the effects of online authenticity and the positivity bias in SNS communication</article-title>
          <source>Computers in Human Behavior</source>
          <year>2014</year>
          <month>1</month>
          <volume>30</volume>
          <fpage>95</fpage>
          <lpage>102</lpage>
          <pub-id pub-id-type="doi">10.1016/j.chb.2013.07.030</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Park</surname>
              <given-names>Gregory</given-names>
            </name>
            <name name-style="western">
              <surname>Yaden</surname>
              <given-names>David Bryce</given-names>
            </name>
            <name name-style="western">
              <surname>Schwartz</surname>
              <given-names>H Andrew</given-names>
            </name>
            <name name-style="western">
              <surname>Kern</surname>
              <given-names>Margaret L</given-names>
            </name>
            <name name-style="western">
              <surname>Eichstaedt</surname>
              <given-names>Johannes C</given-names>
            </name>
            <name name-style="western">
              <surname>Kosinski</surname>
              <given-names>Michael</given-names>
            </name>
            <name name-style="western">
              <surname>Stillwell</surname>
              <given-names>David</given-names>
            </name>
            <name name-style="western">
              <surname>Ungar</surname>
              <given-names>Lyle H</given-names>
            </name>
            <name name-style="western">
              <surname>Seligman</surname>
              <given-names>Martin E P</given-names>
            </name>
          </person-group>
          <article-title>Women are Warmer but No Less Assertive than Men: Gender and Language on Facebook</article-title>
          <source>PLoS One</source>
          <year>2016</year>
          <volume>11</volume>
          <issue>5</issue>
          <fpage>e0155885</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0155885"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0155885</pub-id>
          <pub-id pub-id-type="medline">27223607</pub-id>
          <pub-id pub-id-type="pii">PONE-D-15-49892</pub-id>
          <pub-id pub-id-type="pmcid">PMC4881750</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="web">
          <source>Omnicore</source>
          <access-date>2019-03-18</access-date>
          <comment>Twitter by the Numbers: Stats, Demographics &amp; Fun Facts 
          <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.omnicoreagency.com/twitter-statistics/">https://www.omnicoreagency.com/twitter-statistics/</ext-link></comment>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="web">
          <source>Who is more active on Social Media?</source>
          <access-date>2019-03-19</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.digitalinformationworld.com/2014/10/who-is-more-active-on-social-media-men-or-women-infographic.html">https://www.digitalinformationworld.com/2014/10/who-is-more-active-on-social-media-men-or-women-infographic.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Padilla</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kavak</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Lynch</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Gore</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Diallo</surname>
              <given-names>Saikou Y</given-names>
            </name>
          </person-group>
          <article-title>Temporal and spatiotemporal investigation of tourist attraction visit sentiment on Twitter</article-title>
          <source>PLoS One</source>
          <year>2018</year>
          <volume>13</volume>
          <issue>6</issue>
          <fpage>e0198857</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0198857"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0198857</pub-id>
          <pub-id pub-id-type="medline">29902270</pub-id>
          <pub-id pub-id-type="pii">PONE-D-18-02998</pub-id>
          <pub-id pub-id-type="pmcid">PMC6002102</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gore</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Diallo</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>You Are What You Tweet: Connecting the Geographic Variation in America’s Obesity Rate to Twitter Content</article-title>
          <source>PLoS ONE</source>
          <year>2015</year>
          <volume>10</volume>
          <fpage>1</fpage>
          <lpage>16</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1371/journal.pone.0133505"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Brunner</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hemsley</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Dann</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Togher</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Palmer</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Hashtag #TBI: A content and network data analysis of tweets about Traumatic Brain Injury</article-title>
          <source>Brain Injury</source>
          <year>2017</year>
          <month>12</month>
          <day>08</day>
          <volume>32</volume>
          <issue>1</issue>
          <fpage>49</fpage>
          <lpage>63</lpage>
          <pub-id pub-id-type="doi">10.1080/02699052.2017.1403047</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lachmar</surname>
              <given-names>EM</given-names>
            </name>
            <name name-style="western">
              <surname>Wittenborn</surname>
              <given-names>AK</given-names>
            </name>
            <name name-style="western">
              <surname>Bogen</surname>
              <given-names>KW</given-names>
            </name>
            <name name-style="western">
              <surname>McCauley</surname>
              <given-names>HL</given-names>
            </name>
          </person-group>
          <article-title>#MyDepressionLooksLike: Examining Public Discourse About Depression on Twitter</article-title>
          <source>JMIR Ment Health</source>
          <year>2017</year>
          <month>10</month>
          <day>18</day>
          <volume>4</volume>
          <issue>4</issue>
          <fpage>e43</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://mental.jmir.org/2017/4/e43/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/mental.8141</pub-id>
          <pub-id pub-id-type="medline">29046270</pub-id>
          <pub-id pub-id-type="pii">v4i4e43</pub-id>
          <pub-id pub-id-type="pmcid">PMC5666224</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="web">
          <source>Women's Brain Project</source>
          <access-date>2019-06-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.womensbrainproject.com/">http://www.womensbrainproject.com/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
