<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v21i5e12881</article-id>
      <article-id pub-id-type="pmid">31344669</article-id>
      <article-id pub-id-type="doi">10.2196/12881</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Modeling Spatiotemporal Factors Associated With Sentiment on Twitter: Synthesis and Suggestions for Improving the Identification of Localized Deviations</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Gore</surname>
            <given-names>Ross</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Du</surname>
            <given-names>Jingcheng</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Boonstra</surname>
            <given-names>Tjeerd</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="author" id="contrib1" corresp="yes">
          <name name-style="western">
            <surname>Shah</surname>
            <given-names>Zubair</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Centre for Health Informatics</institution>
            <institution>Australian Institute for Health Innovation</institution>
            <institution>Macquarie University</institution>
            <addr-line>75 Talavera Road, Macquarie Park</addr-line>
            <addr-line>Sydney, 2113</addr-line>
            <country>Australia</country>
            <phone>61 404941319</phone>
            <email>zubair.shah@mq.edu.au</email>
          </address>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-7389-3274</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib2">
          <name name-style="western">
            <surname>Martin</surname>
            <given-names>Paige</given-names>
          </name>
          <degrees>BE</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-6157-4740</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib3">
          <name name-style="western">
            <surname>Coiera</surname>
            <given-names>Enrico</given-names>
          </name>
          <degrees>PhD, MBBS</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-6444-6584</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib4">
          <name name-style="western">
            <surname>Mandl</surname>
            <given-names>Kenneth D</given-names>
          </name>
          <degrees>MD, MPH</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-9781-0477</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib5">
          <name name-style="western">
            <surname>Dunn</surname>
            <given-names>Adam G</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-1720-8209</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
      <label>1</label>
      <institution>Centre for Health Informatics</institution>
      <institution>Australian Institute for Health Innovation</institution>  
      <institution>Macquarie University</institution>  
      <addr-line>Sydney</addr-line>
      <country>Australia</country></aff>
      <aff id="aff2">
      <label>2</label>
      <institution>Computational Health Informatics Program</institution>
      <institution>Boston Children’s Hospital</institution>  
      <addr-line>Boston, MA</addr-line>
      <country>United States</country></aff>
      <aff id="aff3">
      <label>3</label>
      <institution>Department of Biomedical Informatics</institution>
      <institution>Harvard Medical School</institution>  
      <addr-line>Boston, MA</addr-line>
      <country>United States</country></aff>
      <author-notes>
        <corresp>Corresponding Author: Zubair Shah 
        <email>zubair.shah@mq.edu.au</email></corresp>
      </author-notes>
      <pub-date pub-type="collection"><month>05</month><year>2019</year></pub-date>
      <pub-date pub-type="epub">
        <day>08</day>
        <month>05</month>
        <year>2019</year>
      </pub-date>
      <volume>21</volume>
      <issue>5</issue>
      <elocation-id>e12881</elocation-id>
      <!--history from ojs - api-xml-->
      <history>
        <date date-type="received">
          <day>29</day>
          <month>11</month>
          <year>2018</year>
        </date>
        <date date-type="rev-request">
          <day>24</day>
          <month>1</month>
          <year>2019</year>
        </date>
        <date date-type="rev-recd">
          <day>19</day>
          <month>3</month>
          <year>2019</year>
        </date>
        <date date-type="accepted">
          <day>29</day>
          <month>3</month>
          <year>2019</year>
        </date>
      </history>
      <copyright-statement>©Zubair Shah, Paige Martin, Enrico Coiera, Kenneth D Mandl, Adam G Dunn. Originally published in the Journal of Medical Internet Research (http://www.jmir.org), 08.05.2019.</copyright-statement>
      <copyright-year>2019</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on http://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2019/5/e12881/" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Studies examining how sentiment on social media varies depending on timing and location appear to produce inconsistent results, making it hard to design systems that use sentiment to detect localized events for public health applications.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>The aim of this study was to measure how common timing and location confounders explain variation in sentiment on Twitter.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>Using a dataset of 16.54 million English-language tweets from 100 cities posted between July 13 and November 30, 2017, we estimated the positive and negative sentiment for each of the cities using a dictionary-based sentiment analysis and constructed models to explain the differences in sentiment using time of day, day of week, weather, city, and interaction type (conversations or broadcasting) as factors and found that all factors were independently associated with sentiment.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>In the full multivariable model of positive (Pearson r in test data 0.236; 95% CI 0.231-0.241) and negative (Pearson r in test data 0.306; 95% CI 0.301-0.310) sentiment, the city and time of day explained more of the variance than weather and day of week. Models that account for these confounders produce a different distribution and ranking of important events compared with models that do not account for these confounders.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>In public health applications that aim to detect localized events by aggregating sentiment across populations of Twitter users, it is worthwhile accounting for baseline differences before looking for unexpected changes.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>text mining</kwd>
        <kwd>social media</kwd>
        <kwd>public health</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>Data from social media are increasingly being used in the digital phenotyping of individual users and the characterization of population-level behaviors to answer health-related questions [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref7">7</xref>]. Sentiment analysis is a broad class of methods used to detect opinions or mood from text. Although there are a range of approaches used in context-specific situations to detect positive and negative opinions about a topic [<xref ref-type="bibr" rid="ref8">8</xref>-<xref ref-type="bibr" rid="ref12">12</xref>], here we restrict the definition to include the general sentiment analysis methods used to detect mood. Sentiment analysis has also been used for applications in public health to evaluate reactions and attitudes to certain current events [<xref ref-type="bibr" rid="ref13">13</xref>], health interventions such as vaccination [<xref ref-type="bibr" rid="ref14">14</xref>], human mobility [<xref ref-type="bibr" rid="ref15">15</xref>], and outcomes such as seasonal affective disorder and obesity [<xref ref-type="bibr" rid="ref16">16</xref>-<xref ref-type="bibr" rid="ref18">18</xref>].</p>
        <p>When using sentiment analysis tools to observe or find signals of changes in the sentiment of a population, researchers must navigate the complicated interactions between the tools they use and the spatiotemporal and social factors that are known to modify mood and emotion. For example, the positive and negative affect measured by sentiment analysis has been shown to be associated with the time of day and day of week [<xref ref-type="bibr" rid="ref19">19</xref>-<xref ref-type="bibr" rid="ref21">21</xref>], weather [<xref ref-type="bibr" rid="ref22">22</xref>-<xref ref-type="bibr" rid="ref25">25</xref>], and the quality of social interactions [<xref ref-type="bibr" rid="ref26">26</xref>].</p>
        <p>Studies applying sentiment analysis to Twitter data have confirmed the periodicity of positive and negative affect by time of day and day of week [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref27">27</xref>-<xref ref-type="bibr" rid="ref29">29</xref>]. However, the results and conclusions vary from study to study, and these differences may depend on the methods used to aggregate sentiment across sets of tweets or users, differences in the ways the investigators sampled the data, differences in the sentiment analysis algorithms or tools used, or challenges associated with validating results against external information. Studies examining variation in sentiment by geography or weather are relatively rare compared with those that measure temporal variation [<xref ref-type="bibr" rid="ref30">30</xref>-<xref ref-type="bibr" rid="ref34">34</xref>]. Studies that report analyses for social interactions on Twitter—tweets that mention, reply to, or quote other users—do not appear to have focused on measuring differences in the sentiment relative to tweets that broadcast a message [<xref ref-type="bibr" rid="ref35">35</xref>].</p>
      </sec>
      <sec>
        <title>Objectives</title>
        <p>The aim of this study was to construct simple models of positive and negative sentiment using time of day, day of week, interaction type, weather, or city as factors to understand how each of the different modifying factors might distort the results of public health studies that use sentiment analysis to study Twitter data. We then used the model and degenerate versions of the model to measure the magnitude of the differences between expected and observed sentiment over time and show how accounting for spatiotemporal differences affects the ranking of the importance of individual events.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <p>This study was an analysis of tweets posted by Twitter users in 100 cities. To address our aims, we aggregated sentiment scores for each hour in each of the 100 cities and constructed multivariable models to explain differences in the proportion of tweets expressing positive or negative sentiment, using city, interaction type, weather, time of day, and day of week as factors. We selected each of these factors because they have been shown to be associated with sentiment in past research and are relatively easily and accurately inferred from Twitter data.</p>
      <sec>
        <title>Twitter Data</title>
        <p>We used the Twitter streaming application programming interface (API) to collect tweets between July 13 and November 30, 2017, without using any keywords. The retrieved tweets represent an approximate 1% sample of all tweets produced globally. Each tweet contains information about the user including name, location, tweet counts, follower counts, and following counts and the information about the tweet itself such as timestamp and the users it mentions.</p>
        <p>The tweet metadata also indicate whether the tweet was a reply to a previous tweet, was a retweet, or included a link to another tweet (a quote). We used this information to label each tweet as either broadcast (quotes, retweets, and tweets that do not mention other users) or social (replies and direct mentions of other users in the tweet).</p>
      </sec>
      <sec>
        <title>Location Data</title>
        <p>Identifying the home locations of users on Twitter is a challenging task owing to the low number of posts with precise location information (geotags) and the need to parse user-defined location information using a gazetteer. Fewer than 0.5% of tweets are geotagged, and fewer than 50% of Twitter users have provided useful home locations in their profiles [<xref ref-type="bibr" rid="ref36">36</xref>]. To identify the location from which each tweet was posted, we took the user-defined text from the location field in Twitter user profiles and used Nominatim, a gazetteer that returns a JavaScript Object Notation (JSON) object containing structured geographical information and a score associated with the confidence in the answer. We found that Nominatim produces better results if we filter addresses based on the type field of the returned JSON object rather than applying a threshold on the confidence score; therefore, we used the type field to accept the first returned address with a type of city, county, village, suburb, hamlet, state, or country. This helped us to filter out other types of addresses without needing to use a specific threshold.</p>
        <p>Not all Twitter accounts represent individuals; some are brands or organizations where tweets may be posted by humans or bots. Rahimi et al [<xref ref-type="bibr" rid="ref37">37</xref>] used a simple but effective approach to removing <italic>celebrities</italic> in a study on location inference, in which they removed tweets from accounts that had more than 300,000 followers. After examining a set of Twitter users on either side of this threshold in our training data, we followed the same approach and removed all users with at least 300,000 followers.</p>
      </sec>
      <sec>
        <title>Timing Data</title>
        <p>Past studies examining temporal patterns in sentiment on social media have found clear patterns [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref27">27</xref>]. However, those patterns vary substantially from study to study: some observed the most negative sentiment on Mondays and the most positive sentiment on Fridays or Saturdays. Some observed the strongest negative sentiment between 2 am and 5 am, whereas others observed the same between 8 pm and 11 pm.</p>
        <p>As Twitter no longer includes a localized timestamp for users in the metadata of tweets, we used the identified location of the users posting the tweets to convert the timestamps of tweets from Coordinated Universal Time (UTC) to local time. In what follows, all tweets are considered relative to the local time of the city in which the user is believed to be located.</p>
      </sec>
      <sec>
        <title>Weather Data</title>
        <p>Past studies examining weather and sentiment on Twitter have produced variable results, but most observe one or more associations [<xref ref-type="bibr" rid="ref31">31</xref>-<xref ref-type="bibr" rid="ref33">33</xref>]. We collected hourly weather data for the top 100 cities using the API from the Open Weather website [<xref ref-type="bibr" rid="ref38">38</xref>]. The information provided by the Open Weather website includes detailed weather information, such as temperature and humidity, and weather descriptions. We then mapped weather for each hour in each city to one of 7 values: clear, clouds, fog, haze, rain, snow, or storm.</p>
      </sec>
      <sec>
        <title>Sentiment Measures</title>
        <p>Sentiment analysis of written text is a widely studied problem in natural language processing [<xref ref-type="bibr" rid="ref39">39</xref>-<xref ref-type="bibr" rid="ref41">41</xref>]. In this study, we have considered sentiment in a simple form—the presence of positive or negative affect—and applied SentiStrength [<xref ref-type="bibr" rid="ref42">42</xref>], a widely used open-source Java library designed for sentiment analysis of tweets. It has been evaluated manually and compared with a range of advanced machine learning and statistical methods in several studies [<xref ref-type="bibr" rid="ref42">42</xref>-<xref ref-type="bibr" rid="ref44">44</xref>]. SentiStrength is a dictionary-based method, using a lexicon of words categorized as positive or negative with a score for its polarity and strength. For a given tweet, SentiStrength identifies the presence of sentiment terms from its lexicon and computes the sentiment of the text based upon the scores of the words found. SentiStrength produces 2 scores for each tweet, one indicating positive sentiment (from 1 to 5, least positive to most positive, respectively) and one indicating negative sentiment (from 1 to 5, least negative to most negative, respectively). As SentiStrength uses a score of +1 or −1 for neutral words, we considered scores from 2 to 5 for both positive and negative sentiments. In addition, as SentiStrength identifies positive and negative words independently, it is possible for a tweet to be labeled as having positive, negative, or both positive and negative sentiment.</p>
        <p>We aggregated sentiment scores across a set of tweets using the proportion of tweets that have a positive sentiment score (a score from 2 to 5 in positive sentiment) or the proportion of tweets that have a negative sentiment score (a score from 2 to 5 in negative sentiment). Methods for aggregating scores across groups of tweets are important because they can influence the interpretation and lead to different conclusions. To aggregate sentiment scores, researchers have used counts, averages, proportions, ratios, and weighted averages [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref45">45</xref>-<xref ref-type="bibr" rid="ref50">50</xref>]. Some have combined positive and negative scores to create a single measure [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref49">49</xref>], whereas others have kept positive and negative scores separate [<xref ref-type="bibr" rid="ref46">46</xref>,<xref ref-type="bibr" rid="ref47">47</xref>,<xref ref-type="bibr" rid="ref51">51</xref>]. Following Scott et al [<xref ref-type="bibr" rid="ref16">16</xref>], we used positive and negative sentiment scores separately because positive and negative affect can coexist [<xref ref-type="bibr" rid="ref52">52</xref>,<xref ref-type="bibr" rid="ref53">53</xref>] and because, when aggregated, a population can exhibit higher levels of both positive and negative sentiment at the same time. Thus, a low positive score indicates the absence of positive emotion across a set of tweets, not the presence of negative emotion.</p>
      </sec>
      <sec>
        <title>Analysis and Modeling</title>
        <p>In the first part of the analysis, we examined how each of the factors—interaction type, time of day, day of week, weather, and city—was associated with differences in the proportions of tweets that expressed positive or negative sentiment in a city in an hour. To do this, we constructed multivariable regression models using each of the factors individually and then in combination. We chose to use multivariable regression models because they are a simple way of capturing the baseline patterns of sentiment, and models built using individual factors and their combinations can be directly compared. For each model, we reported the r-squared value as a percentage, representing the percentage of the variance in sentiment that can be explained by each model.</p>
        <p>In our evaluation of the models on unseen data, we then reported the correlation (Pearson r) between the values predicted by the model and the observed data in a set of testing data, distinct from the period of observation used to construct the models. These comparisons tell us how important each of the factors is as an independent predictor of the sentiment for a city-hour pair and can provide guidance on which of the factors may be useful to control for when analyzing sentiment to detect changes or anomalies.</p>
        <p>In the second part of the analysis, we have used the models constructed in the first part of the analysis as a baseline for detecting deviations from the expected proportions of positive and negative sentiment tweets per city per hour. The objective was to determine whether baseline differences in spatiotemporal and social factors would introduce biases in the detection of extreme deviations in sentiment that occur during major localized news events and if accounting for them in a baseline model could address these biases. To do this, we compared the expected and observed proportions of positive and negative sentiment tweets per city per hour using a chi-square test and then used the resulting <italic>P</italic> value as an indicator of the magnitude of the deviation.</p>
        <p>Rather than defining an explicit threshold to label hour-city pairs as events or nonevents, we used the magnitude of the deviation in sentiment to rank all hour-city pairs in descending order based on the chi-square test. To make it easier to understand the expected frequency of the events, we defined a recurrence interval: the number of days of observation divided by the frequency of an event of that magnitude across the set of all cities in the analyses. For example, given 60 days of observation in the test period, a recurrence interval of 30 days is an event with a test statistic that was exceeded only twice during the 60 days. A recurrence interval of 1 day is an event with a magnitude that was exceeded 60 times in a 60-day period.</p>
        <p>To characterize an event by its magnitude, we also needed to account for extreme sentiment that persisted for multiple hours or was expressed across multiple cities within a country. To do this, we merged events that produced significant differences between the observed and predicted number of positive or negative sentiment tweets and labeled them using the highest test statistic in the period. Similarly, we merged cities within a country if significant events occurred at the same time. As a result, hour-city pairs could be merged to produce day-city, day-country, or multi–day-country events depending on how many of the ranked deviations were traversed.</p>
        <p>We then compared the events identified from the full model with the events produced by degenerate forms of the full model (eg, excluding city or interaction type as a factor). We used these differences to evaluate how the use of baseline spatiotemporal modeling affected the identification and ranking of extreme sentiment events. The expectation was that the degenerate forms of the models would introduce a bias in the distribution of events toward certain cities or times of day.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <p>On average, we received 3.66 million tweets a day for 141 days, for a total of 507.60 million tweets from 27.61 million unique users. In the dataset, Twitter tagged 29.78% (151.21/507.60 million) as English language. Of these, 65.67% (99.30/151.21 million) had location information available in the users’ profiles.</p>
      <p>After removing celebrity/brand accounts, we ranked cities based on the total number of English language tweets posted by users with locations that the gazetteer was able to resolve. We identified the 100 cities with the highest numbers of English language tweets posted during the study period. These included 52 cities in North America (45 from the United States, 6 from Canada, and 1 from Mexico), 11 cities in the United Kingdom, 6 cities from Europe, 16 cities in Asia and Southeast Asia, 9 cities in Africa, 3 cities in Australasia, 2 cities from the Middle East, and 1 city in South America. We were able to resolve 16.61% (16.50/99.30 million) of the English language tweets to one of the 100 cities (<xref ref-type="fig" rid="figure1">Figure 1</xref>). We used these tweets as the basis for the study.</p>
      <sec>
        <title>Analysis of Spatiotemporal and Social Factors</title>
        <p>The training data used to construct the multivariable models comprised 8.39 million tweets from the first 81 days of data collection (July 13 to September 30, 2017). Of these, we found that 39.69% (3.33 million) expressed positive sentiment and 28.13% (2.36 million) expressed negative sentiment. Users across the 100 cities posted more tweets on Monday to Thursday and slightly fewer tweets from Friday to Sunday. The hour in which users were typically most active was between 12 noon and 1 pm (an average of 7652 tweets across the 100 cities), and users were least active between 4 am and 5 am (an average of 1745 tweets across the 100 cities). The number of tweets in each category of weather varied from snow (230 tweets) and storms (189,201 tweets) to cloudy weather (3,247,680 tweets). Relative to the average proportions of positive and negative sentiment, early morning hours exhibited lower proportions for both positive and negative sentiment, with the highest proportions of positive sentiment between 9 pm and 10 pm and highest rates of negative sentiment in the hours between 11 pm and 1 am, with an additional smaller peak between 7 am and 8 am (<xref ref-type="fig" rid="figure2">Figure 2</xref>). Fridays exhibited the highest proportion of positive sentiment and the lowest proportion of negative sentiment.</p>
        <p>We constructed each model to estimate the proportion of tweets that expressed positive or negative sentiment in a city in an hour and have presented results based on the correlation between the estimated and observed proportions within the training data (<xref ref-type="table" rid="table1">Tables 1</xref> and <xref ref-type="table" rid="table2">2</xref>).</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>From 507.6 million tweets, 16.5 million were labeled as English language and attributed to users in 100 cities.</p>
          </caption>
          <graphic xlink:href="jmir_v21i5e12881_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Observed proportions of positive and negative sentiment aggregated for all city-hour pairs by hour of the day (top), day of the week (center), and weather type (bottom). CIs are an indication of the number of city-hour pairs that contributed and the variability in proportion for that value. All values are categorical, so dotted lines are for visual interpretation only.</p>
          </caption>
          <graphic xlink:href="jmir_v21i5e12881_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Final model coefficient estimates for models of the proportion of tweets that exhibited negative sentiment in an hour.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="210"/>
            <col width="250"/>
            <col width="240"/>
            <col width="280"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Factor</td>
                <td>Number of coefficients (number <italic>P</italic>&lt;.05)</td>
                <td>r-squared in the training period, %</td>
                <td>Pearson r (95% CI) in the testing period</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="5"><bold>Multiple factor models</bold></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>All factors</td>
                <td>136 (108)</td>
                <td>9.345</td>
                <td>0.306 (0.301-0.310)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Social, city, hour, day</td>
                <td>130 (107)</td>
                <td>9.338</td>
                <td>0.306 (0.301-0.310)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Social, city</td>
                <td>101 (80)</td>
                <td>8.831</td>
                <td>0.297 (0.292-0.302)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Hour, day</td>
                <td>30 (26)</td>
                <td>0.486</td>
                <td>0.070 (0.065-0.075)</td>
              </tr>
              <tr valign="top">
                <td colspan="5"><bold>Single factor models</bold></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>City</td>
                <td>100 (81)</td>
                <td>8.736</td>
                <td>0.296 (0.291-0.300)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Hour of day</td>
                <td>24 (20)</td>
                <td>0.298</td>
                <td>0.055 (0.049-0.060)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Day of week</td>
                <td>7 (7)</td>
                <td>0.191</td>
                <td>0.044 (0.039-0.049)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Weather</td>
                <td>7 (5)</td>
                <td>0.193</td>
                <td>0.044 (0.039-0.049)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Social proportion</td>
                <td>2 (2)</td>
                <td>0.010</td>
                <td>0.010 (0.005-0.015)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Final model coefficient estimates for models of the proportion of tweets that exhibited positive sentiment in an hour.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="210"/>
            <col width="250"/>
            <col width="240"/>
            <col width="280"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Factor</td>
                <td>Number of coefficients (number <italic>P</italic>&lt;.05)</td>
                <td>r-squared in the training period, %</td>
                <td>Pearson r (95% CI) in the testing period</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="5"><bold>Multiple factor models</bold></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>All factors</td>
                <td>136 (107)</td>
                <td>5.584</td>
                <td>0.236 (0.231-0.241)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Social, city, hour, day</td>
                <td>130 (107)</td>
                <td>5.580</td>
                <td>0.236 (0.231-0.241)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Social, city</td>
                <td>101 (85)</td>
                <td>4.671</td>
                <td>0.216 (0.211-0.221)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Hour, day</td>
                <td>30 (26)</td>
                <td>1.330</td>
                <td>0.115 (0.110-0.133)</td>
              </tr>
              <tr valign="top">
                <td colspan="5"><bold>Single factor models</bold></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>City</td>
                <td>100 (90)</td>
                <td>3.732</td>
                <td>0.193 (0.188-0.198)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Hour of day</td>
                <td>24 (21)</td>
                <td>1.271</td>
                <td>0.113 (0.108-0.118)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Day of week</td>
                <td>7 (6)</td>
                <td>0.053</td>
                <td>0.023 (0.018-0.028)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Weather</td>
                <td>7 (5)</td>
                <td>0.170</td>
                <td>0.041 (0.036-0.046)</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Social proportion</td>
                <td>2 (2)</td>
                <td>1.387</td>
                <td>0.118 (0.113-0.123)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <p>A model combining both temporal factors was significantly correlated with the proportion of tweets expressing negative sentiment (r=0.070; 95% CI 0.065-0.075). The association was stronger with the proportion of tweets expressing positive sentiment (r=0.115; 95% CI 0.110-0.133) and explained 1.33% of the variance. For both positive and negative sentiment outcomes, adding the day of the week to the hour of the day in the model produced a significant improvement in the model.</p>
        <p>Positive and negative sentiment also varied by interaction type, where social tweets (tweets that mention or reply to another user) were much more likely to be expressions of positive sentiment relative to nonsocial tweets (tweets that do not mention or reply to another user). In hours where higher proportions of tweets were social interactions, the proportion of tweets that expressed positive sentiment was higher (r=0.118; 95% CI 0.113-0.123) and the proportion of tweets that expressed negative sentiment was lower (r=0.010; 95% CI 0.005-0.015), but this was a much weaker association. Adding the proportion of tweets that were social interactions as a factor in multivariable models made a significant improvement to the performance of the model in all cases.</p>
        <p>The median number of tweets per city during the testing period was 48,974 and the number varied from 24,825 (Istanbul, Turkey) to 856,471 (New York City, United States). The numbers of tweets generally matched with the populations of the cities (<xref ref-type="fig" rid="figure3">Figure 3</xref>) and were lower for countries where languages other than English are used. Cities in the United States tended to have higher proportions of negative sentiment tweets and lower proportions of positive sentiment tweets (<xref ref-type="fig" rid="figure4">Figure 4</xref>). Models using only city information exhibited the strongest correlation with the proportion of positive and negative sentiment tweets in an hour compared with all other factors, explaining 8.73% of the variance in negative sentiment (r=0.296; 95% CI 0.291-0.300) and 3.73% of the variance in positive sentiment (r=0.193; 95% CI 0.188-0.198).</p>
        <p>Weather exhibited weak associations with the proportions of tweets expressing positive (r=0.041; 95% CI 0.036-0.046) or negative sentiment (r=0.044; 95% CI 0.039-0.049). Its addition to the multivariable model including all other factors significantly improved the performance. However, as the coefficients for weather were orders of magnitude smaller than other factors such as city and social proportion, weather did not appear to be a useful addition to the baseline models used in the detection of variation in sentiment caused by exogenous factors.</p>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>The number of tweets identified per city relative to the population of the city. Population data were manually collected from Wikipedia in December 2017, using the most recent metropolitan values available. Cities in the United States are highlighted in red and cities are partially labelled.</p>
          </caption>
          <graphic xlink:href="jmir_v21i5e12881_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Sentiment by city in the training period, by proportion of positive (cyan) and negative (orange) sentiment tweets. Cities are ranked in decreasing order of the mean of the proportion of tweets with positive sentiment minus the proportion of tweets with negative sentiment.</p>
          </caption>
          <graphic xlink:href="jmir_v21i5e12881_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Detecting Deviations in City-Level Expression of Positive or Negative Sentiment</title>
        <p>We then used the models constructed above to predict the expected sentiment in city-hour pairs constructed from a separate set of 8.02 million tweets from the following 60 days (October 1 to November 30, 2017). We found similar proportions of tweets expressing positive sentiment (3.20/8.02 million, 39.90%) or negative sentiment (2.28/8.02 million, 28.43%) as we found in the training data. For every hour-city pair, we determined the magnitude of localized deviations by measuring the difference between the expected and observed proportions of positive and negative sentiment tweets.</p>
        <p>Using the full model to identify unexpected deviations in the proportion of positive or negative sentiment tweets in the test period, we ranked events based on the magnitude of the deviation (<xref ref-type="fig" rid="figure5">Figure 5</xref>). As the number of events that might be considered important may vary depending on application, we used the ranked set of all city-hour pairs and traversed the list from the most extreme deviations to the least extreme deviations.</p>
        <p>The top examples of localized deviations are listed in <xref ref-type="table" rid="table3">Table 3</xref>. We aggregated hour-city pairs across contiguous hours and cities wherever possible by reporting the most extreme deviation and merging any subsequent (less extreme) deviation that was on the same day (eg, extreme deviations in sentiment in the same direction on the same day in the same city are merged and reported as a day event) or cities in the same country (eg, 10 am in New York City and 10 am in Los Angeles is reported as 10 am in the United States). This was also extended to merge over both dimensions to report events by country and day. Where contiguous days reported events in the same direction, these events were merged as multi-day events.</p>
        <p>After accounting for city-level differences in baseline proportions of positive and negative sentiment tweets, we found that the highest ranked events were distributed across 7 countries and could be retrospectively matched with major news stories that were specific to each of the cities. Using the degenerate models that do not account for city-level baseline differences, the United States accounted for a lower proportion of extreme positive events (<xref ref-type="fig" rid="figure6">Figure 6</xref>). This occurs because cities in the United States tend to exhibit higher rates of negative sentiment and lower rates of positive sentiment than cities in other countries. Models that do not take this baseline difference into account may overestimate the number of important negative events in the United States (which also has the effect of making violence in Barcelona or Nairobi seem less important) or underestimate the number of positive events in the United States (shifting down positive sentiment events such as Thanksgiving Day parade in New York City, New York or the World Series win in Houston, Texas).</p>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>The set of all city-hour pairs for negative sentiment (left) and positive sentiment (right), ordered by decreasing the chi-square test statistic value. Note that there are thousands of city-hour pairs for which the test produces a P value under .05 (red). The recurrence interval for each city-hour pair is given by the observation period in days (60 days) divided by the value on the horizontal axis.</p>
          </caption>
          <graphic xlink:href="jmir_v21i5e12881_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Examples of extreme city-level events with large deviations detected in sentiment.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="240"/>
            <col width="200"/>
            <col width="200"/>
            <col width="160"/>
            <col width="200"/>
            <thead>
              <tr valign="top">
                <td>Time and location</td>
                <td>Percentage of negative sentiment tweets (% expected)</td>
                <td>Percentage of positive sentiment tweets (% expected)</td>
                <td>Recurrence interval (global; days)</td>
                <td>Corresponding news event in the period</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>October 2, 2017 in the United States</td>
                <td>49.56 (28.70)</td>
                <td>31.30 (38.14)</td>
                <td>&gt;60</td>
                <td>Coverage following Las Vegas shooting</td>
              </tr>
              <tr valign="top">
                <td>November 25-27, 2017 in Manila</td>
                <td>12.13 (22.91)</td>
                <td>73.20 (45.67)</td>
                <td>30</td>
                <td>Miss Universe pageant</td>
              </tr>
              <tr valign="top">
                <td>October 1-2, 2017 in Las Vegas</td>
                <td>61.51 (30.72)</td>
                <td>48.32 (40.52)</td>
                <td>20</td>
                <td>Shooting terror event at a music festival</td>
              </tr>
              <tr valign="top">
                <td>October 1, 2017 in Barcelona</td>
                <td>60.89 (23.78)</td>
                <td>14.67 (39.56)</td>
                <td>12</td>
                <td>Voting for Catalonian independence</td>
              </tr>
              <tr valign="top">
                <td>October 16, 2017 in Barcelona</td>
                <td>67.41 (23.78)</td>
                <td>17.80 (39.67)</td>
                <td>10</td>
                <td>Catalonian independence events</td>
              </tr>
              <tr valign="top">
                <td>November 2, 2017 in Houston</td>
                <td>14.41 (31.61)</td>
                <td>56.60 (38.20)</td>
                <td>8.6</td>
                <td>Houston Astros win World Series</td>
              </tr>
              <tr valign="top">
                <td>November 23, 2017 in New York City</td>
                <td>20.40 (29.01)</td>
                <td>50.51 (37.40)</td>
                <td>7.5</td>
                <td>Thanksgiving Day parade</td>
              </tr>
              <tr valign="top">
                <td>October 19, 2017 in Dubai</td>
                <td>8.11 (25.01)</td>
                <td>92.13 (39.02)</td>
                <td>6</td>
                <td>Diwali festival</td>
              </tr>
              <tr valign="top">
                <td>October 27, 2017 in Nairobi</td>
                <td>48.50 (26.52)</td>
                <td>22.13 (37.32)</td>
                <td>5.5</td>
                <td>Riots following election</td>
              </tr>
              <tr valign="top">
                <td>November 27, 2017 in Seoul</td>
                <td>8.02 (21.01)</td>
                <td>71.67 (43.30)</td>
                <td>5</td>
                <td>2 North Korean embarrassments</td>
              </tr>
              <tr valign="top">
                <td>November 24, 2017 in London</td>
                <td>35.50 (26.51)</td>
                <td>47.12 (37.89)</td>
                <td>4.6</td>
                <td>False terror scare in Oxford Circus</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <fig id="figure6" position="float">
          <label>Figure 6</label>
          <caption>
            <p>Most positive events for the 3 models aggregated where possible over hours, days, and cities. Note that compared with the full model (left), events from the United States tend to be moderated by the baseline tendency away from positive sentiment in the model without cities as factors (center), and the null model (right).</p>
          </caption>
          <graphic xlink:href="jmir_v21i5e12881_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>From among the examples listed in <xref ref-type="table" rid="table3">Table 3</xref>, the visualization of the extreme events illustrates different types of deviations from the baseline (<xref ref-type="fig" rid="figure7">Figure 7</xref>). In each example, the expected baseline is the expected proportion of positive sentiment and negative sentiment tweets in an hour multiplied by the number of tweets from that city. Unexpected deviations occur when the observed number of positive or negative sentiment tweets is much higher or much lower than the baseline (in <xref ref-type="fig" rid="figure7">Figure 7</xref>, colored in red or blue). There were visible differences in the patterns indicating events that occur over a period of time (eg, riots after an election in Nairobi and a day of attempted voting in Barcelona) and events that occur within 1 or several hours (Houston Astros winning a baseball final). Other events not pictured include the outpouring of grief across multiple cities in the United States after a mass shooting, which decays more slowly over a period of days.</p>
        <fig id="figure7" position="float">
          <label>Figure 7</label>
          <caption>
            <p>Examples of individual cities (New York City, Barcelona, Houston, and Nairobi) by the expected (gray areas) and observed (black and colored lines) sentiment. The color of the line indicates the magnitude of the deviation (darker red: more negative or fewer positive tweets; darker blue: more positive or fewer negative tweets).</p>
          </caption>
          <graphic xlink:href="jmir_v21i5e12881_fig7.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <p>When applying sentiment analysis tools to Twitter data to characterize a population over time, it is useful to account for baseline spatiotemporal differences before attempting to detect deviations in mood. The first contribution of this study was to show that hour of day, day of week, the proportion of social tweets, the locations of the users posting the tweets, and the weather are each independently correlated with both positive and negative sentiment. Second, although these factors together account for less than 10% of the variance in positive and negative sentiment, ignoring them can affect the detection of unexpected deviations. Finally, we confirmed that in studies aggregating across populations (ecological designs), positive and negative sentiment can rise and fall independently and aggregating them into a single measure may mean losing important information that helps characterize the mood of a population.</p>
      <sec>
        <title>Comparisons With Past Literature and Implications</title>
        <p>A range of studies have applied sentiment analysis tools to social media data to examine changes in mood or emotion in relation to current events, weather and season, or circadian and daily rhythms. Our results extend these analyses to demonstrate the relative importance of each of these factors.</p>
        <p>We found that the time of day and day of week were more closely correlated with positive sentiment than with negative sentiment. For positive sentiment, models built using these temporal factors typically explain less of the variance than models that used social interactions and cities as factors. Previous studies investigating hourly and daily patterns of sentiment on Twitter vary in structure from cohort designs, where individual users are followed [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref54">54</xref>], to ecological designs where signals from a population are aggregated [<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref55">55</xref>]. The results of these studies and the conclusions they draw appear to be related to design choices including the tools used to measure sentiment and the methods used to aggregate measures of sentiment across populations.</p>
        <p>The results of the study are consistent with previous studies that have found associations between weather and sentiment on Twitter [<xref ref-type="bibr" rid="ref31">31</xref>-<xref ref-type="bibr" rid="ref33">33</xref>]. Despite the observed independent correlations between weather and sentiment, weather explained little of the variance in positive or negative sentiment. These results should not be confused with seasonal variation in weather or sunlight; our results did not extend across a full range of seasons, and other studies have examined the use of Twitter data for its potential to observe seasonal affective disorder [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref17">17</xref>]. Mitchell et al [<xref ref-type="bibr" rid="ref30">30</xref>] examined the geography of happiness in 373 cities in the United States using Twitter data and found that happiness was correlated with socioeconomic status and health-related census data, among other factors. We found that negative sentiment was more common and positive sentiment less common in tweets from many cities in the United States and suggest that future research in the area would benefit from studying international differences in sentiment associated with culture and patterns of living and working that might influence the expression of sentiment on social media.</p>
        <p>Tweets that involve social interactions on Twitter (typically replies and mentions) are common in applications of network science. Our results show a strong positive correlation between the proportion of social interactions in a city in an hour and positive sentiment and a weak correlation with negative sentiment. Future applications that couple network analysis with sentiment tools may benefit from recognizing and potentially accounting for the differences between tweets that are social in nature, relative to those that are broadcasting information.</p>
        <p>Twitter and other social media platforms offer the opportunity to undertake naturalistic studies of human behaviors at unprecedented scales [<xref ref-type="bibr" rid="ref56">56</xref>-<xref ref-type="bibr" rid="ref59">59</xref>]. However, studies in the area are at risk of producing incomparable results and inconsistent conclusions if sampling methods vary in ways that skew toward certain locations or certain times of the day or week. Practitioners in the area are already aware of the risks of selecting only geotagged tweets [<xref ref-type="bibr" rid="ref60">60</xref>], but the spatiotemporal differences we highlight here are typically not discussed or accounted for in applications that use Twitter data to answer public health questions.</p>
      </sec>
      <sec>
        <title>Limitations and Future Work</title>
        <p>The study has several limitations. First, Twitter users represent a biased sample of countries and a biased sample of the population within countries [<xref ref-type="bibr" rid="ref60">60</xref>-<xref ref-type="bibr" rid="ref64">64</xref>], and we did not infer the demographics nor apply any reweighting methods to adjust for differences between the users posting English language tweets and the demographics of the cities we examined. Furthermore, users who include enough biographical information to be located within a city may represent a biased subset of the overall Twitter population, and we did not use location inference methods that take advantage of location-indicative words or social network structure [<xref ref-type="bibr" rid="ref65">65</xref>-<xref ref-type="bibr" rid="ref68">68</xref>] because these could introduce further sampling biases (eg, the overlapping of words in the dictionary and those that are useful in predicting a location). For these reasons, the study only captures deviations that might be expected to be important to population-level (epidemiological) studies.</p>
        <p>Second, we used SentiStrength as a measure of sentiment and did not consider alternatives, sentiment in languages other than English, or ensembles combining multiple tools [<xref ref-type="bibr" rid="ref69">69</xref>-<xref ref-type="bibr" rid="ref72">72</xref>]. We think our use of SentiStrength is justified because it is a commonly used tool in studies in public health and has been examined for sentence-level sentiment and on individual tweets previously [<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]. Although we did not test multiple sentiment detection methods to confirm, we expect that the need to account for baseline spatiotemporal differences is likely to be useful across all other sentiment detection approaches.</p>
        <p>Third, certain events are less localized and affect multiple cities or even multiple countries and others may extend across many hours, days, or weeks. Methods for dealing with the spatiotemporal granularity of these events would be a useful addition to the sets of methods used in analyses of sentiment (or other measures that can be observed in social media datasets). Real-time event detection on Twitter is an active area of research [<xref ref-type="bibr" rid="ref73">73</xref>,<xref ref-type="bibr" rid="ref74">74</xref>], and our aim was not to add to this literature. Rather, we sought to develop a way to improve the robustness of observational studies that use sentiment analysis of Twitter to make sense of how populations react to real-world events.</p>
        <p>Finally, we selected a set of factors that were known to be associated with sentiment on Twitter and used a relatively simple approach to modeling their associations. Other user-level factors and more sophisticated models may improve our ability to account for baseline differences in sentiment, including heterogeneity of individual-level differences that are apparent at population-level scales. For example, other factors that could have been included are gender, age, and number of followers; and other modeling pipelines might consider feature selection or dimensionality reduction and cross-validation techniques to avoid overfitting and improve generalization.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>In this study we showed that in applications that use population-level measures of sentiment on Twitter, it is useful to account for baseline differences in sentiment by time of day, day of week, location, weather, and interaction type. Doing so could improve the accuracy of methods that use sentiment to detect localized events or changes in mood. The first contribution of this research is the consistent evaluation of a broad set of factors—making it easier to compare the importance of location, time, and social interactions on positive and negative sentiment. The second contribution is the use of these factors to construct a simple and interpretable model of the expected variation in positive and negative sentiment on Twitter.</p>
      </sec>
    </sec>
  </body>
  <back>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">API</term>
          <def>
            <p>application programming interface</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">JSON</term>
          <def>
            <p>JavaScript Object Notation</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This research was supported by funding from the National Health and Medical Research Council (Project APP1128968).</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Centola</surname>
            <given-names>D</given-names>
          </name>
        </person-group>
        <article-title>Social media and the science of health behavior</article-title>
        <source>Circulation</source>  
        <year>2013</year>  
        <month>05</month>  
        <day>28</day>  
        <volume>127</volume>  
        <issue>21</issue>  
        <fpage>2135</fpage>  
        <lpage>44</lpage>  
        <pub-id pub-id-type="doi">10.1161/CIRCULATIONAHA.112.101816</pub-id>
        <pub-id pub-id-type="medline">23716382</pub-id>
        <pub-id pub-id-type="pii">127/21/2135</pub-id></nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Salathé</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Bengtsson</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Bodnar</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Brewer</surname>
            <given-names>DD</given-names>
          </name>
          <name name-style="western">
            <surname>Brownstein</surname>
            <given-names>JS</given-names>
          </name>
          <name name-style="western">
            <surname>Buckee</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Campbell</surname>
            <given-names>EM</given-names>
          </name>
          <name name-style="western">
            <surname>Cattuto</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Khandelwal</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Mabry</surname>
            <given-names>PL</given-names>
          </name>
          <name name-style="western">
            <surname>Vespignani</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>Digital epidemiology</article-title>
        <source>PLoS Comput Biol</source>  
        <year>2012</year>  
        <volume>8</volume>  
        <issue>7</issue>  
        <fpage>e1002616</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pcbi.1002616"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1371/journal.pcbi.1002616</pub-id>
        <pub-id pub-id-type="medline">22844241</pub-id>
        <pub-id pub-id-type="pii">PCOMPBIOL-D-12-00494</pub-id>
        <pub-id pub-id-type="pmcid">PMC3406005</pub-id></nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Dredze</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>How social media will change public health</article-title>
        <source>IEEE Intell Syst</source>  
        <year>2012</year>  
        <volume>27</volume>  
        <issue>4</issue>  
        <fpage>81</fpage>  
        <lpage>84</lpage>  
        <pub-id pub-id-type="doi">10.1109/MIS.2012.76</pub-id></nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Paul</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Dredze</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <source>Association for the Advancement of Artificial Intelligence</source>  
        <year>2011</year>  
        <access-date>2019-04-17</access-date>
        <comment>You are what you Tweet: Analyzing Twitter for public health 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cs.jhu.edu/~mdredze/publications/twitter_health_icwsm_11.pdf">https://www.cs.jhu.edu/~mdredze/publications/twitter_health_icwsm_11.pdf</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="77iSu3Co2"/></comment> </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Coppersmith</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Dredze</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Harman</surname>
            <given-names>C</given-names>
          </name>
        </person-group>
        <source>Association for Computational Linguistics</source>  
        <year>2014</year>  
        <access-date>2019-04-17</access-date>
        <comment>Quantifying mental health signals in Twitter 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cs.jhu.edu/~mdredze/publications/2014_acl_mental_health.pdf">https://www.cs.jhu.edu/~mdredze/publications/2014_acl_mental_health.pdf</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="77iT5hB1a"/></comment> </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>De Choudhury</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Counts</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Horvitz</surname>
            <given-names>E</given-names>
          </name>
        </person-group>
        <article-title>Social media as a measurement tool of depression in populations</article-title>
        <source>Proceedings of the 5th Annual ACM Web Science Conference</source>  
        <year>2013</year>  
        <conf-name>WebSci '13</conf-name>
        <conf-date>May 02-04, 2013</conf-date>
        <conf-loc>Paris, France</conf-loc>
        <pub-id pub-id-type="doi">10.1145/2464464.2464480</pub-id></nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Althouse</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Scarpino</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Meyers</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Ayers</surname>
            <given-names>JW</given-names>
          </name>
          <name name-style="western">
            <surname>Bargsten</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Baumbach</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Brownstein</surname>
            <given-names>JS</given-names>
          </name>
          <name name-style="western">
            <surname>Castro</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Clapham</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Cummings</surname>
            <given-names>DA</given-names>
          </name>
          <name name-style="western">
            <surname>Del Valle</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Eubank</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Fairchild</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Finelli</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Generous</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>George</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Harper</surname>
            <given-names>DR</given-names>
          </name>
          <name name-style="western">
            <surname>Hébert-Dufresne</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Johansson</surname>
            <given-names>MA</given-names>
          </name>
          <name name-style="western">
            <surname>Konty</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Lipsitch</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Milinovich</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Miller</surname>
            <given-names>JD</given-names>
          </name>
          <name name-style="western">
            <surname>Nsoesie</surname>
            <given-names>EO</given-names>
          </name>
          <name name-style="western">
            <surname>Olson</surname>
            <given-names>DR</given-names>
          </name>
          <name name-style="western">
            <surname>Paul</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Polgreen</surname>
            <given-names>PM</given-names>
          </name>
          <name name-style="western">
            <surname>Priedhorsky</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Read</surname>
            <given-names>JM</given-names>
          </name>
          <name name-style="western">
            <surname>Rodríguez-Barraquer</surname>
            <given-names>I</given-names>
          </name>
          <name name-style="western">
            <surname>Smith</surname>
            <given-names>DJ</given-names>
          </name>
          <name name-style="western">
            <surname>Stefansen</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Swerdlow</surname>
            <given-names>DL</given-names>
          </name>
          <name name-style="western">
            <surname>Thompson</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Vespignani</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Wesolowski</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>Enhancing disease surveillance with novel data streams: challenges and opportunities</article-title>
        <source>EPJ Data Sci</source>  
        <year>2015</year>  
        <volume>4</volume>  
        <fpage>17</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27990325"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1140/epjds/s13688-015-0054-0</pub-id>
        <pub-id pub-id-type="medline">27990325</pub-id>
        <pub-id pub-id-type="pmcid">PMC5156315</pub-id></nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Tumasjan</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Sprenger</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Sandner</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Welpe</surname>
            <given-names>I</given-names>
          </name>
        </person-group>
        <article-title>Predicting elections with Twitter: What 140 characters reveal about political sentiment</article-title>
        <year>2010</year>  
        <conf-name>Fourth International AAAI Conference on Weblogs and Social Media</conf-name>
        <conf-date>2010</conf-date>
        <conf-loc>Washington, USA</conf-loc>
        <fpage>178</fpage>  
        <lpage>185</lpage> </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Bermingham</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Smeaton</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>On using Twitter to monitor political sentiment and predict election results</article-title>
        <year>2011</year>  
        <conf-name>Proceedings of the Workshop on Sentiment Analysis where AI meets Psychology (SAAIP)</conf-name>
        <conf-date>2011</conf-date>
        <conf-loc>Chiang Mai, Thailand</conf-loc>
        <fpage>2</fpage>  
        <lpage>10</lpage> </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Asur</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Huberman</surname>
            <given-names>B</given-names>
          </name>
        </person-group>
        <article-title>Predicting the future with social media</article-title>
        <year>2010</year>  
        <conf-name>IEEE/WIC/ACM International Conference on Web Intelligence and Intelligent Agent Technology</conf-name>
        <conf-date>31 August-3 September, 2010</conf-date>
        <conf-loc>Toronto, ON, Canada</conf-loc>
        <fpage>492</fpage>  
        <lpage>99</lpage>  
        <pub-id pub-id-type="doi">10.1109/WI-IAT.2010.63</pub-id></nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Jain</surname>
            <given-names>V</given-names>
          </name>
        </person-group>
        <article-title>Prediction of movie success using sentiment analysis of tweets</article-title>
        <source>JSCSE</source>  
        <year>2013</year>  
        <volume>3</volume>  
        <issue>3</issue>  
        <fpage>308</fpage>  
        <lpage>13</lpage>  
        <pub-id pub-id-type="doi">10.7321/jscse.v3.n3.46</pub-id></nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Pasek</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Yan</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Conrad</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Newport</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Marken</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <article-title>The stability of economic correlations over time: identifying conditions under which survey tracking polls and Twitter sentiment yield similar conclusions</article-title>
        <source>Public Opin Q</source>  
        <year>2018</year>  
        <volume>82</volume>  
        <issue>3</issue>  
        <fpage>470</fpage>  
        <lpage>92</lpage>  
        <pub-id pub-id-type="doi">10.1093/poq/nfy030</pub-id></nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Bollen</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Mao</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Pepe</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>Modeling public mood and emotion: Twitter sentiment and socio-economic phenomena</article-title>
        <source>Proceedings of the Fifth International AAAI Conference on Weblogs and Social Media</source>  
        <year>2011</year>  
        <conf-name>ICWSM 2011</conf-name>
        <conf-date>17-21 July, 2011</conf-date>
        <conf-loc>Barcelona, Spain</conf-loc>
        <fpage>450</fpage>  
        <lpage>53</lpage> </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Salathé</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Khandelwal</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <article-title>Assessing vaccination sentiments with online social media: implications for infectious disease dynamics and control</article-title>
        <source>PLoS Comput Biol</source>  
        <year>2011</year>  
        <month>10</month>  
        <volume>7</volume>  
        <issue>10</issue>  
        <fpage>e1002199</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pcbi.1002199"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1371/journal.pcbi.1002199</pub-id>
        <pub-id pub-id-type="medline">22022249</pub-id>
        <pub-id pub-id-type="pii">PCOMPBIOL-D-11-00652</pub-id>
        <pub-id pub-id-type="pmcid">PMC3192813</pub-id></nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Frank</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Mitchell</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Dodds</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Danforth</surname>
            <given-names>C</given-names>
          </name>
        </person-group>
        <article-title>Happiness and the patterns of life: a study of geolocated tweets</article-title>
        <source>Sci Rep</source>  
        <year>2013</year>  
        <volume>3</volume>  
        <fpage>2625</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.doi.org/10.1038/srep02625"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1038/srep02625</pub-id>
        <pub-id pub-id-type="medline">24026340</pub-id>
        <pub-id pub-id-type="pii">srep02625</pub-id></nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Golder</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Macy</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Diurnal and seasonal mood vary with work, sleep, and daylength across diverse cultures</article-title>
        <source>Science</source>  
        <year>2011</year>  
        <month>09</month>  
        <day>30</day>  
        <volume>333</volume>  
        <issue>6051</issue>  
        <fpage>1878</fpage>  
        <lpage>81</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.sciencemag.org/cgi/pmidlookup?view=long&amp;pmid=21960633"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1126/science.1202775</pub-id>
        <pub-id pub-id-type="medline">21960633</pub-id>
        <pub-id pub-id-type="pii">333/6051/1878</pub-id></nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Coppersmith</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Dredze</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Harman</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Hollingshead</surname>
            <given-names>K</given-names>
          </name>
        </person-group>
        <source>Association for Computational Linguistics</source>  
        <year>2015</year>  
        <access-date>2019-04-17</access-date>
        <comment>From ADHD to SAD: Analyzing the Language of Mental Health on Twitter through Self-Reported Diagnoses 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://www.aclweb.org/anthology/W15-1201">https://www.aclweb.org/anthology/W15-1201</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="77iU1VNnQ"/></comment> </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Gore</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Diallo</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Padilla</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>You are what you Tweet: connecting the geographic variation in America's obesity rate to Twitter content</article-title>
        <source>PLoS One</source>  
        <year>2015</year>  
        <volume>10</volume>  
        <issue>9</issue>  
        <fpage>e0133505</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0133505"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1371/journal.pone.0133505</pub-id>
        <pub-id pub-id-type="medline">26332588</pub-id>
        <pub-id pub-id-type="pii">PONE-D-15-02269</pub-id>
        <pub-id pub-id-type="pmcid">PMC4557976</pub-id></nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Super</surname>
            <given-names>DE</given-names>
          </name>
        </person-group>
        <article-title>A life-span, life-space approach to career development</article-title>
        <source>J Vocat Behav</source>  
        <year>1980</year>  
        <volume>16</volume>  
        <issue>3</issue>  
        <fpage>282</fpage>  
        <lpage>98</lpage>  
        <pub-id pub-id-type="doi">10.1016/0001-8791(80)90056-1</pub-id></nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Stone</surname>
            <given-names>AA</given-names>
          </name>
          <name name-style="western">
            <surname>Schneider</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Harter</surname>
            <given-names>JK</given-names>
          </name>
        </person-group>
        <article-title>Day-of-week mood patterns in the United States: on the existence of ‘Blue Monday’, ‘Thank God it's Friday’ and weekend effects</article-title>
        <source>J Posit Psychol</source>  
        <year>2012</year>  
        <volume>7</volume>  
        <issue>4</issue>  
        <fpage>306</fpage>  
        <lpage>14</lpage>  
        <pub-id pub-id-type="doi">10.1080/17439760.2012.691980</pub-id></nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Egloff</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Tausch</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Kohlmann</surname>
            <given-names>CW</given-names>
          </name>
          <name name-style="western">
            <surname>Krohne</surname>
            <given-names>HW</given-names>
          </name>
        </person-group>
        <article-title>Relationships between time of day, day of the week, and positive mood: exploring the role of the mood measure</article-title>
        <source>Motiv Emot</source>  
        <year>1995</year>  
        <volume>19</volume>  
        <issue>2</issue>  
        <fpage>99</fpage>  
        <lpage>110</lpage>  
        <pub-id pub-id-type="doi">10.1007/BF02250565</pub-id></nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Howarth</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Hoffman</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>A multidimensional approach to the relationship between mood and weather</article-title>
        <source>Br J Psychol</source>  
        <year>1984</year>  
        <month>02</month>  
        <volume>75</volume>  
        <issue>Pt 1</issue>  
        <fpage>15</fpage>  
        <lpage>23</lpage>  
        <pub-id pub-id-type="medline">6704634</pub-id></nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Denissen</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Butalid</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Penke</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>van Aken</surname>
            <given-names>MA</given-names>
          </name>
        </person-group>
        <article-title>The effects of weather on daily mood: a multilevel approach</article-title>
        <source>Emotion</source>  
        <year>2008</year>  
        <month>10</month>  
        <volume>8</volume>  
        <issue>5</issue>  
        <fpage>662</fpage>  
        <lpage>7</lpage>  
        <pub-id pub-id-type="doi">10.1037/a0013497</pub-id>
        <pub-id pub-id-type="medline">18837616</pub-id>
        <pub-id pub-id-type="pii">2008-13989-008</pub-id></nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Klimstra</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Frijns</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Keijsers</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Denissen</surname>
            <given-names>JJ</given-names>
          </name>
          <name name-style="western">
            <surname>Raaijmakers</surname>
            <given-names>QA</given-names>
          </name>
          <name name-style="western">
            <surname>van Aken</surname>
            <given-names>MA</given-names>
          </name>
          <name name-style="western">
            <surname>Koot</surname>
            <given-names>HM</given-names>
          </name>
          <name name-style="western">
            <surname>van Lier</surname>
            <given-names>PA</given-names>
          </name>
          <name name-style="western">
            <surname>Meeus</surname>
            <given-names>WH</given-names>
          </name>
        </person-group>
        <article-title>Come rain or come shine: individual differences in how weather affects mood</article-title>
        <source>Emotion</source>  
        <year>2011</year>  
        <month>12</month>  
        <volume>11</volume>  
        <issue>6</issue>  
        <fpage>1495</fpage>  
        <lpage>9</lpage>  
        <pub-id pub-id-type="doi">10.1037/a0024649</pub-id>
        <pub-id pub-id-type="medline">21842988</pub-id>
        <pub-id pub-id-type="pii">2011-18046-001</pub-id></nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Baylis</surname>
            <given-names>P</given-names>
          </name>
        </person-group>
        <source>Energy Institute at HAAS</source>  
        <year>2015</year>  
        <access-date>2019-04-18</access-date>
        <comment>Temperature and Temperament: Evidence from a Billion Tweets 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://ei.haas.berkeley.edu/research/papers/WP265.pdf">https://ei.haas.berkeley.edu/research/papers/WP265.pdf</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="77iVouI2S"/></comment> </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Berry</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Hansen</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>Positive affect, negative affect, and social interaction</article-title>
        <source>J Pers Soc Psychol</source>  
        <year>1996</year>  
        <volume>71</volume>  
        <issue>4</issue>  
        <fpage>796</fpage>  
        <lpage>809</lpage>  
        <pub-id pub-id-type="doi">10.1037/0022-3514.71.4.796</pub-id></nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Dodds</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Harris</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Kloumann</surname>
            <given-names>I</given-names>
          </name>
          <name name-style="western">
            <surname>Bliss</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Danforth</surname>
            <given-names>C</given-names>
          </name>
        </person-group>
        <article-title>Temporal patterns of happiness and information in a global social network: hedonometrics and Twitter</article-title>
        <source>PLoS One</source>  
        <year>2011</year>  
        <volume>6</volume>  
        <issue>12</issue>  
        <fpage>e26752</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0026752"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1371/journal.pone.0026752</pub-id>
        <pub-id pub-id-type="medline">22163266</pub-id>
        <pub-id pub-id-type="pii">PONE-D-11-01360</pub-id>
        <pub-id pub-id-type="pmcid">PMC3233600</pub-id></nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>O'Connor</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Balasubramanyan</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Routledge</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Smith</surname>
            <given-names>N</given-names>
          </name>
        </person-group>
        <source>Association for the Advancement of Artificial Intelligence</source>  
        <year>2010</year>  
        <access-date>2019-04-18</access-date>
        <comment>From tweets to polls: Linking text sentiment to public opinion time series 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://www.aaai.org/ocs/index.php/ICWSM/ICWSM10/paper/viewFile/1536/1842">https://www.aaai.org/ocs/index.php/ICWSM/ICWSM10/paper/viewFile/1536/1842</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="77iVzqWLO"/></comment> </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Larsen</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Boonstra</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Batterham</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>O'Dea</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Paris</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Christensen</surname>
            <given-names>H</given-names>
          </name>
        </person-group>
        <article-title>We feel: mapping emotion on Twitter</article-title>
        <source>IEEE J Biomed Health Inform</source>  
        <year>2015</year>  
        <volume>19</volume>  
        <issue>4</issue>  
        <fpage>1246</fpage>  
        <lpage>52</lpage>  
        <pub-id pub-id-type="doi">10.1109/JBHI.2015.2403839</pub-id></nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Mitchell</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Frank</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Harris</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Dodds</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Danforth</surname>
            <given-names>C</given-names>
          </name>
        </person-group>
        <article-title>The geography of happiness: connecting twitter sentiment and expression, demographics, and objective characteristics of place</article-title>
        <source>PLoS One</source>  
        <year>2013</year>  
        <volume>8</volume>  
        <issue>5</issue>  
        <fpage>e64417</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0064417"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1371/journal.pone.0064417</pub-id>
        <pub-id pub-id-type="medline">23734200</pub-id>
        <pub-id pub-id-type="pii">PONE-D-13-07723</pub-id>
        <pub-id pub-id-type="pmcid">PMC3667195</pub-id></nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Park</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Lee</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Kim</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Park</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Park</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Cha</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <source>Association for the Advancement of Artificial Intelligence</source>  
        <year>2013</year>  
        <access-date>2019-04-18</access-date>
        <comment>Mood and weather: Feeling the heat? 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://www.aaai.org/ocs/index.php/ICWSM/ICWSM13/paper/view/6068/6330">https://www.aaai.org/ocs/index.php/ICWSM/ICWSM13/paper/view/6068/6330</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="77iWC82Tl"/></comment> </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Hannak</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Anderson</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Barrett</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Lehmann</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Mislove</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Riedewald</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <source>Association for the Advancement of Artificial Intelligence</source>  
        <year>2012</year>  
        <access-date>2019-04-18</access-date>
        <comment>Tweetin’ in the Rain: Exploring Societal-scale Effects of Weather on Mood 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.ccs.neu.edu/home/amislove/publications/Weather-ICWSM.pdf">http://www.ccs.neu.edu/home/amislove/publications/Weather-ICWSM.pdf</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="77iWHGNe6"/></comment> </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Li</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>X</given-names>
          </name>
          <name name-style="western">
            <surname>Hovy</surname>
            <given-names>E</given-names>
          </name>
        </person-group>
        <article-title>What a Nasty Day: Exploring Mood-Weather Relationship from Twitter</article-title>
        <source>Proceedings of the 23rd ACM International Conference on Information and Knowledge Management</source>  
        <year>2014</year>  
        <conf-name>CIKM '14</conf-name>
        <conf-date>November 03-07, 2014</conf-date>
        <conf-loc>Shanghai, China</conf-loc>
        <fpage>1309</fpage>  
        <lpage>18</lpage>  
        <pub-id pub-id-type="doi">10.1145/2661829.2662090</pub-id></nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Padilla</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Kavak</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Lynch</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Gore</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Diallo</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <article-title>Temporal and spatiotemporal investigation of tourist attraction visit sentiment on Twitter</article-title>
        <source>PLoS One</source>  
        <year>2018</year>  
        <volume>13</volume>  
        <issue>6</issue>  
        <fpage>e0198857</fpage>  
        <pub-id pub-id-type="doi">10.1371/journal.pone.0198857</pub-id>
        <pub-id pub-id-type="medline">29902270</pub-id>
        <pub-id pub-id-type="pii">PONE-D-18-02998</pub-id>
        <pub-id pub-id-type="pmcid">PMC6002102</pub-id></nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Giachanou</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Crestani</surname>
            <given-names>F</given-names>
          </name>
        </person-group>
        <article-title>Like it or not: a survey of Twitter sentiment analysis methods</article-title>
        <source>ACM Comput Surv</source>  
        <year>2016</year>  
        <volume>49</volume>  
        <issue>2</issue>  
        <fpage>28</fpage>  
        <pub-id pub-id-type="doi">10.1145/2938640</pub-id></nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Mahmud</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Nichols</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Drews</surname>
            <given-names>C</given-names>
          </name>
        </person-group>
        <article-title>Home location identification of twitter users</article-title>
        <source>ACM Trans Intell Syst Technol</source>  
        <year>2014</year>  
        <volume>5</volume>  
        <issue>3</issue>  
        <fpage>47</fpage>  
        <pub-id pub-id-type="doi">10.1145/2528548</pub-id></nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Rahimi</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Cohn</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Baldwin</surname>
            <given-names>T</given-names>
          </name>
        </person-group>
        <source>Association for Computational Linguistics</source>  
        <year>2015</year>  
        <access-date>2019-04-18</access-date>
        <comment>Twitter User Geolocation Using a Unified Text and Network Prediction Model 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://www.aclweb.org/anthology/P15-2104">https://www.aclweb.org/anthology/P15-2104</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="77iWeiIQq"/></comment> </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="web">
        <source>Open Weather Map</source>  
        <access-date>2018-11-22</access-date>
        <comment>Weather API 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://openweathermap.org/api">https://openweathermap.org/api</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="746qWakXy"/></comment> </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Ravi</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Ravi</surname>
            <given-names>V</given-names>
          </name>
        </person-group>
        <article-title>A survey on opinion mining and sentiment analysis: tasks, approaches and applications</article-title>
        <source>Knowl Based Syst</source>  
        <year>2015</year>  
        <volume>89</volume>  
        <fpage>14</fpage>  
        <lpage>46</lpage>  
        <pub-id pub-id-type="doi">10.1016/j.knosys.2015.06.015</pub-id></nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Ribeiro</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Araújo</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Gonçalves</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Gonçalves</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Benevenuto</surname>
            <given-names>F</given-names>
          </name>
        </person-group>
        <article-title>Sentibench-a benchmark comparison of state-of-the-practice sentiment analysis methods</article-title>
        <source>EPJ Data Sci</source>  
        <year>2016</year>  
        <volume>5</volume>  
        <fpage>23</fpage>  
        <pub-id pub-id-type="doi">10.1140/epjds/s13688-016-0085-1</pub-id></nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Reagan</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Danforth</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Tivnan</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Williams</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Dodds</surname>
            <given-names>P</given-names>
          </name>
        </person-group>
        <article-title>Sentiment analysis methods for understanding large-scale texts: a case for using continuum-scored words and word shift graphs</article-title>
        <source>EPJ Data Sci</source>  
        <year>2017</year>  
        <volume>6</volume>  
        <fpage>28</fpage>  
        <pub-id pub-id-type="doi">10.1140/epjds/s13688-017-0121-9</pub-id></nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Thelwall</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Buckley</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Paltoglou</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Cai</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Kappas</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>Sentiment strength detection in short informal text</article-title>
        <source>J Assoc Inf Sci Technol</source>  
        <year>2010</year>  
        <volume>61</volume>  
        <issue>12</issue>  
        <fpage>2544</fpage>  
        <lpage>58</lpage> </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Gonçalves</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Araújo</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Benevenuto</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Cha</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Comparing and combining sentiment analysis methods</article-title>
        <source>Proceedings of the first ACM conference on Online social networks</source>  
        <year>2013</year>  
        <conf-name>COSN '13</conf-name>
        <conf-date>October 07-08, 2013</conf-date>
        <conf-loc>Boston, Massachusetts, USA</conf-loc>
        <fpage>27</fpage>  
        <lpage>38</lpage> </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Thelwall</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Buckley</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Paltoglou</surname>
            <given-names>G</given-names>
          </name>
        </person-group>
        <article-title>Sentiment in Twitter events</article-title>
        <source>J Assoc Inf Sci Technol</source>  
        <year>2011</year>  
        <volume>62</volume>  
        <issue>2</issue>  
        <fpage>406</fpage>  
        <lpage>18</lpage> </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Thelwall</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <source>University of Wolverhampton</source>  
        <year>2014</year>  
        <access-date>2019-04-18</access-date>
        <comment>Sentiment analysis and time series with Twitter 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://mozdeh.wlv.ac.uk/resources/TwitterTimeSeriesAndSentimentAnalysis.pdf">http://mozdeh.wlv.ac.uk/resources/TwitterTimeSeriesAndSentimentAnalysis.pdf</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="77iXpW733"/></comment> </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Alves</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>de Souza</surname>
            <given-names>BC</given-names>
          </name>
          <name name-style="western">
            <surname>Firmino</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>de Oliveira</surname>
            <given-names>MG</given-names>
          </name>
          <name name-style="western">
            <surname>de Paiva</surname>
            <given-names>AC</given-names>
          </name>
        </person-group>
        <article-title>A spatial and temporal sentiment analysis approach applied to Twitter microtexts</article-title>
        <source>JIDM</source>  
        <year>2016</year>  
        <volume>6</volume>  
        <issue>2</issue>  
        <fpage>118</fpage>  
        <lpage>29</lpage> </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Balog</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Mishne</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>De Rijke</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Why are they excited?: identifying and explaining spikes in blog mood levels</article-title>
        <source>Proceedings of the Eleventh Conference of the European Chapter of the Association for Computational Linguistics: Posters &amp; Demonstrations</source>  
        <year>2006</year>  
        <conf-name>EACL '06</conf-name>
        <conf-date>April 05-06, 2006</conf-date>
        <conf-loc>Trento, Italy</conf-loc>
        <fpage>207</fpage>  
        <lpage>10</lpage> </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Bollen</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Mao</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Zeng</surname>
            <given-names>X</given-names>
          </name>
        </person-group>
        <article-title>Twitter mood predicts the stock market</article-title>
        <source>J Comput Sci</source>  
        <year>2011</year>  
        <volume>2</volume>  
        <issue>1</issue>  
        <fpage>1</fpage>  
        <lpage>8</lpage>  
        <pub-id pub-id-type="doi">10.1016/j.jocs.2010.12.007</pub-id></nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Antweiler</surname>
            <given-names>W</given-names>
          </name>
          <name name-style="western">
            <surname>Frank</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Is all that talk just noise? The information content of internet stock message boards</article-title>
        <source>J Finance</source>  
        <year>2004</year>  
        <volume>59</volume>  
        <issue>3</issue>  
        <fpage>1259</fpage>  
        <lpage>94</lpage> </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Kramer</surname>
            <given-names>ADI</given-names>
          </name>
        </person-group>
        <article-title>An unobtrusive behavioral model of "gross national happiness"</article-title>
        <source>Proceedings of the SIGCHI conference on human factors in computing systems</source>  
        <year>2010</year>  
        <conf-name>CHI '10</conf-name>
        <conf-date>April 10-15, 2010</conf-date>
        <conf-loc>Atlanta, Georgia, USA</conf-loc></nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Gilbert</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Karahalios</surname>
            <given-names>K</given-names>
          </name>
        </person-group>
        <article-title>Widespread Worry and the Stock Market</article-title>
        <year>2010</year>  
        <conf-name>Proceedings of the International Conference on Weblogs and Social Media</conf-name>
        <conf-date>2010</conf-date>
        <conf-loc>Washington, USA</conf-loc></nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Diener</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Emmons</surname>
            <given-names>R</given-names>
          </name>
        </person-group>
        <article-title>The independence of positive and negative affect</article-title>
        <source>J Pers Soc Psychol</source>  
        <year>1984</year>  
        <month>11</month>  
        <volume>47</volume>  
        <issue>5</issue>  
        <fpage>1105</fpage>  
        <lpage>17</lpage>  
        <pub-id pub-id-type="medline">6520704</pub-id></nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Clark</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Watson</surname>
            <given-names>D</given-names>
          </name>
        </person-group>
        <article-title>Mood and the mundane: relations between daily life events and self-reported mood</article-title>
        <source>J Pers Soc Psychol</source>  
        <year>1988</year>  
        <month>02</month>  
        <volume>54</volume>  
        <issue>2</issue>  
        <fpage>296</fpage>  
        <lpage>308</lpage>  
        <pub-id pub-id-type="medline">3346815</pub-id></nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Bollen</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Gonçalves</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>van de Leemput</surname>
            <given-names>I</given-names>
          </name>
          <name name-style="western">
            <surname>Ruan</surname>
            <given-names>G</given-names>
          </name>
        </person-group>
        <article-title>The happiness paradox: your friends are happier than you</article-title>
        <source>EPJ Data Sci</source>  
        <year>2017</year>  
        <volume>6</volume>  
        <issue>1</issue>  
        <fpage>4</fpage>  
        <pub-id pub-id-type="doi">10.1140/epjds/s13688-017-0100-1</pub-id></nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Burnap</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Williams</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Us and them: identifying cyber hate on Twitter across multiple protected characteristics</article-title>
        <source>EPJ Data Sci</source>  
        <year>2016</year>  
        <volume>5</volume>  
        <fpage>11</fpage> </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>An</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Quercia</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Cha</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Gummadi</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Crowcroft</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>Sharing political news: the balancing act of intimacy and socialization in selective exposure</article-title>
        <source>EPJ Data Sci</source>  
        <year>2014</year>  
        <volume>3</volume>  
        <fpage>12</fpage>  
        <pub-id pub-id-type="doi">10.1140/epjds/s13688-014-0012-2</pub-id></nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Salathé</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Vu</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Khandelwal</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Hunter</surname>
            <given-names>D</given-names>
          </name>
        </person-group>
        <article-title>The dynamics of health behavior sentiments on a large online social network</article-title>
        <source>EPJ Data Sci</source>  
        <year>2013</year>  
        <volume>2</volume>  
        <fpage>4</fpage>  
        <pub-id pub-id-type="doi">10.1140/epjds16</pub-id></nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Volkova</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Charles</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Harrison</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Corley</surname>
            <given-names>C</given-names>
          </name>
        </person-group>
        <article-title>Uncovering the relationships between military community health and affects expressed in social media</article-title>
        <source>EPJ Data Sci</source>  
        <year>2017</year>  
        <volume>6</volume>  
        <fpage>9</fpage>  
        <pub-id pub-id-type="doi">10.1140/epjds/s13688-017-0102-z</pub-id></nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Dunn</surname>
            <given-names>AM</given-names>
          </name>
          <name name-style="western">
            <surname>Coiera</surname>
            <given-names>E</given-names>
          </name>
        </person-group>
        <article-title>Social media interventions for precision public health: promises and risks</article-title>
        <source>NPJ Digit Med</source>  
        <year>2018</year>  
        <volume>1</volume>  
        <fpage>47</fpage>  
        <pub-id pub-id-type="doi">10.1038/s41746-018-0054-0</pub-id></nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Sloan</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Morgan</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>Who tweets with their location? Understanding the relationship between demographic characteristics and the use of Geoservices and Geotagging on Twitter</article-title>
        <source>PLoS One</source>  
        <year>2015</year>  
        <volume>10</volume>  
        <issue>11</issue>  
        <fpage>e0142209</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0142209"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1371/journal.pone.0142209</pub-id>
        <pub-id pub-id-type="medline">26544601</pub-id>
        <pub-id pub-id-type="pii">PONE-D-15-35431</pub-id>
        <pub-id pub-id-type="pmcid">PMC4636345</pub-id></nlm-citation>
      </ref>
      <ref id="ref61">
        <label>61</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Sloan</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Morgan</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Burnap</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Williams</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Who tweets? Deriving the demographic characteristics of age, occupation and social class from Twitter user meta-data</article-title>
        <source>PLoS One</source>  
        <year>2015</year>  
        <volume>10</volume>  
        <issue>3</issue>  
        <fpage>e0115545</fpage>  
        <pub-id pub-id-type="doi">10.1371/journal.pone.0115545</pub-id></nlm-citation>
      </ref>
      <ref id="ref62">
        <label>62</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Mislove</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Lehmann</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Ahn</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Onnela</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Rosenquist</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>Understanding the Demographics of Twitter Users</article-title>
        <source>Proceedings of the Fifth International AAAI Conference on Weblogs and Social Media</source>  
        <year>2011</year>  
        <conf-name>AAAI Press</conf-name>
        <conf-date>2011</conf-date>
        <conf-loc>Barcelona, Spain</conf-loc>
        <fpage>554</fpage>  
        <lpage>57</lpage> </nlm-citation>
      </ref>
      <ref id="ref63">
        <label>63</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Sadah</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Shahbazi</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Wiley</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Hristidis</surname>
            <given-names>V</given-names>
          </name>
        </person-group>
        <article-title>A study of the demographics of web-based health-related social media users</article-title>
        <source>J Med Internet Res</source>  
        <year>2015</year>  
        <month>08</month>  
        <day>06</day>  
        <volume>17</volume>  
        <issue>8</issue>  
        <fpage>e194</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.jmir.org/2015/8/e194/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/jmir.4308</pub-id>
        <pub-id pub-id-type="medline">26250986</pub-id>
        <pub-id pub-id-type="pii">v17i8e194</pub-id>
        <pub-id pub-id-type="pmcid">PMC4705027</pub-id></nlm-citation>
      </ref>
      <ref id="ref64">
        <label>64</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Malik</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Lamba</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Nakos</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Pfeffer</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>Population bias in Geotagged tweets</article-title>
        <year>2015</year>  
        <conf-name>Ninth International AAAI Conference on Web and Social Media</conf-name>
        <conf-date>May 26–29, 2015</conf-date>
        <conf-loc>Oxford, England</conf-loc>
        <fpage>531</fpage> </nlm-citation>
      </ref>
      <ref id="ref65">
        <label>65</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Szabo</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Sheng</surname>
            <given-names>Q</given-names>
          </name>
        </person-group>
        <article-title>Sense and focus: towards effective location inference and event detection on Twitter</article-title>
        <year>2015</year>  
        <conf-name>International Conference on Web Information Systems Engineering</conf-name>
        <conf-date>2015</conf-date>
        <conf-loc>Miami, FL, USA</conf-loc>
        <fpage>463</fpage>  
        <lpage>77</lpage>  
        <pub-id pub-id-type="doi">10.1007/978-3-319-26190-4_31</pub-id></nlm-citation>
      </ref>
      <ref id="ref66">
        <label>66</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Compton</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Jurgens</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Allen</surname>
            <given-names>D</given-names>
          </name>
        </person-group>
        <article-title>Geotagging one hundred million twitter accounts with total variation minimization</article-title>
        <year>2014</year>  
        <conf-name>2014 IEEE International Conference on Big Data (Big Data)</conf-name>
        <conf-date>October 27-30, 2014</conf-date>
        <conf-loc>Washington, DC, USA</conf-loc>
        <fpage>393</fpage>  
        <lpage>401</lpage>  
        <pub-id pub-id-type="doi">10.1109/BigData.2014.7004256</pub-id></nlm-citation>
      </ref>
      <ref id="ref67">
        <label>67</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Jurgens</surname>
            <given-names>D</given-names>
          </name>
        </person-group>
        <source>HRL Laboratories</source>  
        <year>2013</year>  
        <access-date>2019-04-18</access-date>
        <comment>That's What Friends Are For: Inferring Location in Online Social Media Platforms Based on Social Relationships 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://jurgens.people.si.umich.edu/docs/icwsm-2013-slides.pdf">http://jurgens.people.si.umich.edu/docs/icwsm-2013-slides.pdf</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="77iZOwXyC"/></comment> </nlm-citation>
      </ref>
      <ref id="ref68">
        <label>68</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Ajao</surname>
            <given-names>O</given-names>
          </name>
          <name name-style="western">
            <surname>Hong</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>W</given-names>
          </name>
        </person-group>
        <article-title>A survey of location inference techniques on Twitter</article-title>
        <source>J Inf Sci</source>  
        <year>2015</year>  
        <volume>41</volume>  
        <issue>6</issue>  
        <fpage>855</fpage>  
        <lpage>64</lpage>  
        <pub-id pub-id-type="doi">10.1177/0165551515602847</pub-id></nlm-citation>
      </ref>
      <ref id="ref69">
        <label>69</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Koto</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Adriani</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>A comparative study on twitter sentiment analysis: Which features are good?</article-title>
        <year>2015</year>  
        <conf-name>International Conference on Applications of Natural Language to Information Systems</conf-name>
        <conf-date>2015</conf-date>
        <conf-loc>Salford, United Kingdom</conf-loc>
        <fpage>453</fpage>  
        <lpage>57</lpage>  
        <pub-id pub-id-type="doi">10.1007/978-3-319-19581-0_46</pub-id></nlm-citation>
      </ref>
      <ref id="ref70">
        <label>70</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Saif</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Fernandez</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>He</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Alani</surname>
            <given-names>H</given-names>
          </name>
        </person-group>
        <article-title>Evaluation datasets for Twitter sentiment analysis: a survey and a new dataset, the STS-Gold</article-title>
        <year>2013</year>  
        <conf-name>1st International Workshop on Emotion and Sentiment in Social and Expressive Media: Approaches and Perspectives from AI (ESSEM 2013)</conf-name>
        <conf-date>December 3, 2013</conf-date>
        <conf-loc>Turin, Italy</conf-loc></nlm-citation>
      </ref>
      <ref id="ref71">
        <label>71</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Gonçalves</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Dalip</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Costa</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Gonçalves</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Benevenuto</surname>
            <given-names>F</given-names>
          </name>
        </person-group>
        <article-title>On the combination of "off-the-shelf" sentiment analysis methods</article-title>
        <source>Proceedings of the 31st Annual ACM Symposium on Applied Computing</source>  
        <year>2016</year>  
        <conf-name>SAC '16</conf-name>
        <conf-date>April 04-08, 2016</conf-date>
        <conf-loc>Pisa, Italy</conf-loc>
        <fpage>1158</fpage>  
        <lpage>65</lpage> </nlm-citation>
      </ref>
      <ref id="ref72">
        <label>72</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Yan</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>HM</given-names>
          </name>
        </person-group>
        <article-title>Two simple and effective ensemble classifiers for Twitter sentiment analysis</article-title>
        <year>2017</year>  
        <conf-name>2017 Computing Conference</conf-name>
        <conf-date>July 18-20, 2017</conf-date>
        <conf-loc>London, UK</conf-loc>
        <fpage>1386</fpage>  
        <lpage>93</lpage>  
        <pub-id pub-id-type="doi">10.1109/SAI.2017.8252275</pub-id></nlm-citation>
      </ref>
      <ref id="ref73">
        <label>73</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Atefeh</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Khreich</surname>
            <given-names>W</given-names>
          </name>
        </person-group>
        <article-title>A survey of techniques for event detection in twitter</article-title>
        <source>Comput Intell</source>  
        <year>2015</year>  
        <volume>31</volume>  
        <issue>1</issue>  
        <fpage>132</fpage>  
        <lpage>64</lpage>  
        <pub-id pub-id-type="doi">10.1111/coin.12017</pub-id></nlm-citation>
      </ref>
      <ref id="ref74">
        <label>74</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Weng</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Lee</surname>
            <given-names>BS</given-names>
          </name>
        </person-group>
        <article-title>Event detection in Twitter</article-title>
        <source>Proceedings of the 2nd International Workshop on Social Computing</source>  
        <year>2011</year>  
        <conf-name>IWSC '18</conf-name>
        <conf-date>2011</conf-date>
        <conf-loc>Barcelona, Spain</conf-loc>
        <fpage>401</fpage>  
        <lpage>08</lpage> </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
