<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v21i6e12394</article-id>
      <article-id pub-id-type="pmid">31162126</article-id>
      <article-id pub-id-type="doi">10.2196/12394</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Monitoring Physical Activity Levels Using Twitter Data: Infodemiology Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Stetten</surname>
            <given-names>Nichole</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Gore</surname>
            <given-names>Ross</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="author" id="contrib1" corresp="yes" equal-contrib="yes">
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>Sam</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>School of Exercise Science, Physical and Health Education</institution>
            <institution>University of Victoria</institution>
            <addr-line>McKinnon Building 124</addr-line>
            <addr-line>Victoria, BC, V8W 2Y2</addr-line>
            <country>Canada</country>
            <phone>1 250 721 8392</phone>
            <email>samliu@uvic.ca</email>
          </address>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-2364-7774</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib2">
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>Brian</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-7655-6986</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib3">
          <name name-style="western">
            <surname>Kuo</surname>
            <given-names>Alex</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-4996-5578</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
      <label>1</label>
      <institution>School of Exercise Science, Physical and Health Education</institution>
      <institution>University of Victoria</institution>  
      <addr-line>Victoria, BC</addr-line>
      <country>Canada</country></aff>
      <aff id="aff2">
      <label>2</label>
      <institution>Department of Health Information Science</institution>
      <institution>University of Victoria</institution>  
      <addr-line>Victoria, BC</addr-line>
      <country>Canada</country></aff>
      <author-notes>
        <corresp>Corresponding Author: Sam Liu 
        <email>samliu@uvic.ca</email></corresp>
      </author-notes>
      <pub-date pub-type="collection"><month>06</month><year>2019</year></pub-date>
      <pub-date pub-type="epub">
        <day>03</day>
        <month>06</month>
        <year>2019</year>
      </pub-date>
      <volume>21</volume>
      <issue>6</issue>
      <elocation-id>e12394</elocation-id>
      <!--history from ojs - api-xml-->
      <history>
        <date date-type="received">
          <day>16</day>
          <month>10</month>
          <year>2018</year>
        </date>
        <date date-type="rev-request">
          <day>3</day>
          <month>2</month>
          <year>2019</year>
        </date>
        <date date-type="rev-recd">
          <day>12</day>
          <month>4</month>
          <year>2019</year>
        </date>
        <date date-type="accepted">
          <day>14</day>
          <month>4</month>
          <year>2019</year>
        </date>
      </history>
      <copyright-statement>©Sam Liu, Brian Chen, Alex Kuo. Originally published in the Journal of Medical Internet Research (http://www.jmir.org), 03.06.2019.</copyright-statement>
      <copyright-year>2019</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on http://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2019/6/e12394/" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Social media technology such as Twitter allows users to share their thoughts, feelings, and opinions online. The growing body of social media data is becoming a central part of infodemiology research as these data can be combined with other public health datasets (eg, physical activity levels) to provide real-time monitoring of psychological and behavior outcomes that inform health behaviors. Currently, it is unclear whether Twitter data can be used to monitor physical activity levels.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>The aim of this study was to establish the feasibility of using Twitter data to monitor physical activity levels by assessing whether the frequency and sentiment of physical activity–related tweets were associated with physical activity levels across the United States.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>Tweets were collected from Twitter’s application programming interface (API) between January 10, 2017 and January 2, 2018. We used Twitter's <italic>garden hose</italic> method of collecting tweets, which provided a random sample of approximately 1% of all tweets with location metadata falling within the United States. Geotagged tweets were filtered. A list of physical activity–related hashtags was collected and used to further classify these geolocated tweets. Twitter data were merged with physical activity data collected as part of the Behavioral Risk Factor Surveillance System. Multiple linear regression models were fit to assess the relationship between physical activity–related tweets and physical activity levels by county while controlling for population and socioeconomic status measures.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>During the study period, 442,959,789 unique tweets were collected, of which 64,005,336 (14.44%) were geotagged with latitude and longitude coordinates. Aggregated data were obtained for a total of 3138 counties in the United States. The mean county-level percentage of physically active individuals was 74.05% (SD 5.2) and 75.30% (SD 4.96) after adjusting for age. The model showed that the percentage of physical activity–related tweets was significantly associated with physical activity levels (beta=.11; SE 0.2; <italic>P</italic>&lt;.001) and age-adjusted physical activity (beta=.10; SE 0.20; <italic>P</italic>&lt;.001) on a county level while adjusting for both Gini index and education level. However, the overall explained variance of the model was low (<italic>R</italic><sup>2</sup>=.11). The sentiment of the physical activity–related tweets was not a significant predictor of physical activity level and age-adjusted physical activity on a county level after including the Gini index and education level in the model (<italic>P</italic>&gt;.05).</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Social media data may be a valuable tool for public health organizations to monitor physical activity levels, as it can overcome the time lag in the reporting of physical activity epidemiology data faced by traditional research methods (eg, surveys and observational studies). Consequently, this tool may have the potential to help public health organizations better mobilize and target physical activity interventions.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>physical activity</kwd>
        <kwd>social media</kwd>
        <kwd>internet</kwd>
        <kwd>social media</kwd>
        <kwd>Twitter messaging</kwd>
        <kwd>population surveillance</kwd>
        <kwd>public health</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>Physical inactivity is a modifiable risk factor for developing a widening variety of chronic conditions including cardiovascular diseases, hypertension, type 2 diabetes mellitus, colon cancers, osteoporosis, and depression [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref5">5</xref>]. Currently, many adults in the United States are physically inactive and do not meet the recommended amount of physical activity (150 min of moderate-intensity aerobic exercise per week) [<xref ref-type="bibr" rid="ref6">6</xref>]. Furthermore, the prevalence of physical activity varies across geographic regions in the United States [<xref ref-type="bibr" rid="ref7">7</xref>]. This lack of uniformity in the rate of physical activity in various geographic regions has become one of the top priorities for public health agencies—to collect population-level physical activity data. This epidemiology data can help identify groups and populations who are not engaged in regular physical activity and locations where these individuals live [<xref ref-type="bibr" rid="ref8">8</xref>-<xref ref-type="bibr" rid="ref10">10</xref>]. Local public health agencies can use this information to deploy appropriate resources to target health promotion efforts to improve physical activity levels in physically inactive regions. In fact, several studies have demonstrated the feasibility of using social media and internet-based interventions to promote physical activity on a population level [<xref ref-type="bibr" rid="ref11">11</xref>-<xref ref-type="bibr" rid="ref15">15</xref>]. Real-time epidemiology data of groups and locations of individuals who are not engaged in regular physical activity may further enhance public health agencies’ capabilities to personalize and target their interventions.</p>
        <p>Existing methods of using population-based survey studies to monitor physical activity need to be improved. There are several limitations in current methods of collecting physical activity data [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref16">16</xref>]. First, reporting physical activity survey data in the United States involves up to 2 to 3 years of lag time, whereas surveys themselves can be time-consuming and resource-intensive to conduct. Sparsity of data can be challenging for many surveys, as response rates may not vary uniformly by location, demographics, or population. Therefore, innovative research approaches are needed to supplement and improve the current state of physical activity monitoring.</p>
        <p>Social media use has grown rapidly in the last decade, [<xref ref-type="bibr" rid="ref17">17</xref>] and researchers have been examining ways to use <italic>social data</italic> to better understand and monitor public health problems in <italic>real-time</italic> [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref18">18</xref>]. This growing area of research has been called <italic>infodemiology</italic> or <italic>infoveillance</italic> studies [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref20">20</xref>]. Social media technology, such as Twitter, allows users to communicate with each other by sharing short messages. Users can share their thoughts, feelings, and opinions on these social media platforms and, as a result, social media data may be used to provide real-time monitoring of behavioral outcomes that inform health behaviors [<xref ref-type="bibr" rid="ref21">21</xref>]. A unique aspect of social media data from Twitter is that the posts are public and geotagged and thus, all internet users, including health researchers, can readily access these data. In addition, unique to Twitter is the use of hashtags (<italic>#</italic>) that allow a user to highlight and allow other users to follow relevant topics of interest. Given their high level of use, these sites collect an enormous amount of data (eg, over 500 million tweets per day on Twitter) [<xref ref-type="bibr" rid="ref21">21</xref>].</p>
        <p>Recent infodemiology studies have reported that data from social media technologies can be combined with other biomedical datasets to help predict health outcomes [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref22">22</xref>-<xref ref-type="bibr" rid="ref25">25</xref>]. The main approaches to analyze unstructured text data from Twitter include frequency of keyword occurrence (analysis of information prevalence and information occurrence ratio) and the sentiment of the tweets [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref19">19</xref>]. These approaches are not mutually exclusive and thus can be used together for monitoring physical activity. Information prevalence and information occurrence ratios measure the absolute or relative <italic>frequency</italic> of occurrences of a certain keyword. The amount of social data is constantly increasing; thus, normalized indicators (eg, information occurrence ratio) may be more meaningful than absolute figures on information prevalence [<xref ref-type="bibr" rid="ref19">19</xref>]. Finally, sentiment analysis can determine whether an individual’s attitude or perception toward a topic is positive, negative, or neutral. By applying these methods, researchers have shown that social data can be used to identify symptoms associated with psychological distress, anxiety, and depression [<xref ref-type="bibr" rid="ref22">22</xref>] and identify infectious disease outbreaks, such as influenza transmission [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref27">27</xref>] and HIV outbreaks [<xref ref-type="bibr" rid="ref24">24</xref>]. Previous studies have also reported that the frequency of physical activity–related tweets and the sentiment of the tweets are related to obesity rates [<xref ref-type="bibr" rid="ref28">28</xref>], social disparity, and wellness indicators in US Metropolitan Statistical Areas (MSAs) [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref30">30</xref>]. Currently, it remains unclear whether these methods of analyzing physical activity–related tweets can be applied to monitor the physical activity level on a county level across the United States while controlling for socioeconomic inequality and education level.</p>
      </sec>
      <sec>
        <title>Objectives</title>
        <p>The aim of this study was to establish the feasibility of using Twitter data to monitor physical activity levels by assessing whether the frequency and sentiment of physical activity–related tweets were associated with physical activity levels in various counties across the United States.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Overview</title>
        <p>Tweets (n=442,959,789) were collected from January 10, 2017, to January 2, 2018, using Twitter’s application programming interface (API). The captured tweets represent an estimated 1% random selection of all tweets posted in a selected time frame. Only <italic>geolocated</italic> tweets with coordinates or within the bounding box defined by –162.354635, 18.756125, –53.755999, 73.893030 were retained for analysis. Additional processing was applied to filter out tweets with coordinates not originating from the United States, leaving a final sample of 64,005,336 tweets. To categorize tweets on a county level, a reverse-geocoding pipeline using cartographic boundary shapefiles from the US Census Bureau was created to assign a Federal Information Processing Standard code for each tweet.</p>
      </sec>
      <sec>
        <title>Classifying Physical Activity–Related Tweets</title>
        <p>A list of physical activity–related hashtags was compiled (see <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>) to identify tweets that might be related to exercise or physical activity. The hashtags were compiled using a combination of the most popular physical activity–related hashtags and the guidelines for exercise testing published by the American College of Sports Medicine (ACSM) [<xref ref-type="bibr" rid="ref31">31</xref>]. The ACSM guideline was used because it provided an extensive list of physical activity–related keywords that were well established, and this method has been used in previous research [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref31">31</xref>]. A tweet was classified as a physical activity–related tweet if it contained one or more physical activity–related keyword in the tweet’s hashtags. Although previous studies have relied on dictionaries of exercise-related keywords (eg, from the Compendium of Physical Activities and ACSM guidelines for exercise testing) to classify tweets, using hashtags presents a couple of important advantages: they can be parsed as distinct entities from tweets and can represent more specific multi-word phrases [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>]. As such, there is less risk of ambiguity with hashtags than with a dictionary or list of keywords (eg, <italic>walk</italic> and <italic>surf</italic> may have multiple meanings outside of physical activity, whereas <italic>#30daysoffitness</italic> is unlikely to). Previous research has also discussed the difficulty of this classification task, either electing to improve precision by imposing additional rules (eg, requiring additional context for commonly ambiguous terms such as <italic>running</italic>) on top of the basic dictionary word check list or choosing not to apply any additional filtering to avoid introducing additional biases into the sampling methodology [<xref ref-type="bibr" rid="ref29">29</xref>]. Although using hashtags does not rectify the issue of curation bias, it does allow for far more specific matching against text than regular words, while also maintaining the simplicity of a simple list of items. This inherently trades off increased precision at the loss of recall or sensitivity but ensures that fewer unrelated tweets are passed to the sentiment analysis pipeline.</p>
      </sec>
      <sec>
        <title>Sentiment Analysis</title>
        <p>Using sentiment analysis techniques to study microblogging services such as Twitter is a rich and active area of study. Sentiment analysis assigns text documents polarities, labels such as <italic>positive</italic>, <italic>negative</italic>, and <italic>neutral</italic> that describe the writer’s attitude as written. When applied to a topic, sentiment analysis may be used to predict or infer these attitudes based primarily on a collection of documents. This study utilized a sentiment analysis model created by Baziotis, Pelekis, and Doulkeridis for the 2017 International Workshop on Semantic Evaluation (SemEval) [<xref ref-type="bibr" rid="ref32">32</xref>,<xref ref-type="bibr" rid="ref33">33</xref>]. This model ranked first in Subtask A of Task 4 (<italic>Sentiment Analysis in Twitter</italic>) at SemEval 2017 and employs a bidirectional long short-term memory neural network with an attention mechanism [<xref ref-type="bibr" rid="ref34">34</xref>].</p>
      </sec>
      <sec>
        <title>Physical Activity Dataset</title>
        <p>Physical activity levels and age-adjusted physical activity levels were extracted from the Behavioral Risk Factor Surveillance System (BRFSS) surveys, which provides county-level data of physical activity levels from the year 2014. The BRFSS is administered by the Centers for Disease Control and Prevention. As part of the survey, participants were asked to self-report leisure-time physical activity (eg, during the past month, other than your regular job, did you participate in any physical activities or exercises such as running, calisthenics, golf, gardening, or walking for exercise?). Self-reported leisure-time physical inactivity was ascertained from answers of <italic>no</italic> to the questions. The BRFSS physical activity data were collected for adults aged 18 years and older, thus BRFSS also reported age-adjusted physical activity data based on the US standard population. Socioeconomic status measures, such as the Gini index, were collected from the American Community Survey.</p>
      </sec>
      <sec>
        <title>Statistical Analysis</title>
        <p>The frequency of physical activity tweets was tallied from each county and merged with physical activity levels from the BRFSS data, Gini index data, and percent of the county that received college education. The Gini index provides a standardized estimate of income inequality that may be used for comparisons between counties. Including the Gini index and education level is pertinent in the context of physical activity; these variables have been associated with levels of physical activity [<xref ref-type="bibr" rid="ref35">35</xref>].</p>
        <p>A bivariate Spearman correlation was used to determine the association between the number of physical activity–related tweets (including the number of positive, negative, and neutral tweets), the Gini index, education, and physical activity data. Multiple linear regression models were then applied to find the level of association between the proportion of physical activity–related tweets, sentiment of the tweets (ratio of positive to negative physical activity–related tweets), and physical activity data while controlling for the Gini index and education level on a county level. The relative performance of these models was compared. All analyses were performed using IBM SPSS 24.0 (IBM Corporation).</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <p>Of the 442,959,789 unique tweets collected, 64,005,336 (14.44%) were geotagged. Of these, 234,678 (0.37%) were identified to be physical activity–related based on their hashtags. Los Angeles County (n=20,589; 8.77%), New York County (n=12,601; 5.37%), Miami–Dade County (n=7055; 3.01%), Harris County (n=6148; 2.62%), and Cook County (n=5738; 2.45%) were the 5 counties that sent the most geotagged physical activity–related tweets (<xref ref-type="fig" rid="figure1">Figure 1</xref>).</p>
      <p>Aggregated data were obtained for a total of 3138 out of 3146 counties or county equivalents. The counties omitted for analysis lacked correlated Twitter data, physical activity data, or data on the socioeconomic indicators. The mean county-level percentage of individuals that are physically active was 74.05% (SD 5.2) and 75.30% (SD 4.96) after adjusting for age (<xref ref-type="fig" rid="figure2">Figure 2</xref>). Maps of the Gini index and education levels are displayed in <xref ref-type="fig" rid="figure3">Figures 3</xref> and <xref ref-type="fig" rid="figure4">4</xref>.</p>
      <p>Our sentiment analysis showed that 7.31% (n=17,155) of the physical activity–related tweets identified were positive, 42.67% (n=100,137) were negative, and 50.02% (n=117,386) were neutral. The mean ratio between positive and negative was 0.20 (SD 0.336). <xref ref-type="boxed-text" rid="box1">Textbox 1</xref> shows example tweets. On the basis of the correlation analysis, county-level physical activity and age-adjusted physical activity level showed a significant positive weak-to-moderate correlation with the percentage of physical activity–related tweets and the sentiment of physical activity–related tweets (<xref ref-type="table" rid="table1">Table 1</xref>).</p>
      <fig id="figure1" position="float">
        <label>Figure 1</label>
        <caption>
          <p>Map of physical activity levels in the United States.</p>
        </caption>
        <graphic xlink:href="jmir_v21i6e12394_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <fig id="figure2" position="float">
        <label>Figure 2</label>
        <caption>
          <p>Map of physical activity–related geolocated tweets in the United States.</p>
        </caption>
        <graphic xlink:href="jmir_v21i6e12394_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <fig id="figure3" position="float">
        <label>Figure 3</label>
        <caption>
          <p>Map of Gini index across the United States.</p>
        </caption>
        <graphic xlink:href="jmir_v21i6e12394_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <fig id="figure4" position="float">
        <label>Figure 4</label>
        <caption>
          <p>Map of education level across the United States.</p>
        </caption>
        <graphic xlink:href="jmir_v21i6e12394_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <boxed-text id="box1" position="float">
        <title>Example tweets classified with positive, negative, and neutral sentiment.</title>
        <p>Classified positive:</p>
        <list list-type="bullet">
          <list-item>
            <p>“Growth physically, mentally, spiritually, financially. That will be my 2017....#instafit…”</p>
          </list-item>
          <list-item>
            <p>“I think between us we've lost a whole person! #fitgoals…”</p>
          </list-item>
          <list-item>
            <p>“Today's reminder: it's about practice, not perfection! #yogajournal…”</p>
          </list-item>
        </list>
        <p>Classified negative:</p>
        <list list-type="bullet">
          <list-item>
            <p>“I hate Tuesdays. Extra. #cardio”</p>
          </list-item>
          <list-item>
            <p>“Shoutout to #crossfit ... More like curbstomp am I right guys?! @ Portland, Oregon”</p>
          </list-item>
          <list-item>
            <p>“Back to the grind… #cardio”</p>
          </list-item>
        </list>
        <p>Classified neutral:</p>
        <list list-type="bullet">
          <list-item>
            <p>“Where’s the #belly I see it! #handful but in a good way #fitness #goals continue…”</p>
          </list-item>
          <list-item>
            <p>“Day 2 of my 2 a day workouts down #gymlife #planetfitness…”</p>
          </list-item>
          <list-item>
            <p>“Clips of my leg day #squatsanddeads #bodybuilding #powerlifting #strongman #olympiclicting #fit…”</p>
          </list-item>
        </list>
      </boxed-text>
      <table-wrap position="float" id="table1">
        <label>Table 1</label>
        <caption>
          <p>Summary of county-level physical activity, activity-related tweets, and the Gini index.</p>
        </caption>
        <table width="1000" cellpadding="6" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="340"/>
          <col width="100"/>
          <col width="140"/>
          <col width="90"/>
          <col width="90"/>
          <col width="80"/>
          <col width="160"/>
          <thead>
            <tr valign="top">
              <td>Variable</td>
              <td>Physically active, %</td>
              <td>Physically active, % (age adjusted)</td>
              <td>Gini index</td>
              <td>Education</td>
              <td>Physical activity tweets</td>
              <td>The ratio between positive and negative physical activity tweets</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>Physically active, %</td>
              <td>1</td>
              <td>0.99<sup>a</sup></td>
              <td>–0.16<sup>a</sup></td>
              <td>0.26<sup>a</sup></td>
              <td>0.38<sup>a</sup></td>
              <td>0.13<sup>a</sup></td>
            </tr>
            <tr valign="top">
              <td>Physically active, % (age adjusted)</td>
              <td>—<sup>b</sup></td>
              <td>1</td>
              <td>–1.77<sup>a</sup></td>
              <td>0.24<sup>a</sup></td>
              <td>0.34<sup>a</sup></td>
              <td>0.10<sup>a</sup></td>
            </tr>
            <tr valign="top">
              <td>Gini index</td>
              <td>—</td>
              <td>—</td>
              <td>1</td>
              <td>0.04<sup>c</sup></td>
              <td>0.05<sup>c</sup></td>
              <td>0.09<sup>a</sup></td>
            </tr>
            <tr valign="top">
              <td>Education</td>
              <td>—</td>
              <td>—</td>
              <td>—</td>
              <td>1</td>
              <td>0.22<sup>a</sup></td>
              <td>0.16<sup>a</sup></td>
            </tr>
            <tr valign="top">
              <td>Physical activity tweets</td>
              <td>—</td>
              <td>—</td>
              <td>—</td>
              <td>—</td>
              <td>1</td>
              <td>0.20<sup>a</sup></td>
            </tr>
            <tr valign="top">
              <td>Positive / negative physical activity tweets ratio</td>
              <td>—</td>
              <td>—</td>
              <td>—</td>
              <td>—</td>
              <td>—</td>
              <td>1</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table1fn1">
            <p><sup>a</sup><italic>P</italic>&lt;.001.</p>
          </fn>
          <fn id="table1fn2">
            <p><sup>b</sup>Not applicable.</p>
          </fn>
          <fn id="table1fn3">
            <p><sup>c</sup><italic>P</italic>&lt;.02.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
      <p>The regression models showed that the percentage of physical activity–related tweets was significantly associated with the physical activity level (<xref ref-type="table" rid="table2">Table 2</xref>) and age-adjusted physical activity on a county level (<xref ref-type="table" rid="table3">Table 3</xref>) while adjusting for both the Gini index and education level. However, the sentiment of the physical activity–related tweets was not a significant predictor of the physical activity level and age-adjusted physical activity on a county level after including the Gini index and education level in the model. The best-fit model for predicting county-level physical activity incorporated the percentage of physical activity–related tweets, the Gini index, and the prevalence of college education. However, the overall explained variance of the model was low (<italic>R</italic><sup>2</sup>=.11) Similarly, the best-fit model for predicting county-level physical activity (<italic>R</italic><sup>2</sup>=.09) after adjusting for age used the percentage of physical activity–related tweets, the Gini index, and the education level.</p>
      <table-wrap position="float" id="table2">
        <label>Table 2</label>
        <caption>
          <p>Regression analysis for physical activity–related tweets and county-level physical activity level.</p>
        </caption>
        <table width="1000" cellpadding="7" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="30"/>
          <col width="670"/>
          <col width="100"/>
          <col width="100"/>
          <col width="100"/>
          <thead>
            <tr valign="top">
              <td colspan="2">Variables</td>
              <td>beta</td>
              <td>SE</td>
              <td><italic>P</italic> value</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td colspan="5"><bold>Model 1<sup>a</sup></bold></td>
            </tr>
            <tr valign="top">
              <td><break/></td>
              <td>Gini index</td>
              <td>−0.16</td>
              <td>2.54</td>
              <td>&lt;.001</td>
            </tr>
            <tr valign="top">
              <td><break/></td>
              <td>Education</td>
              <td>0.26</td>
              <td>.01</td>
              <td>&lt;.001</td>
            </tr>
            <tr valign="top">
              <td><break/></td>
              <td>Percent of physical activity–related tweets</td>
              <td>0.11</td>
              <td>.20</td>
              <td>&lt;.001</td>
            </tr>
            <tr valign="top">
              <td colspan="5"><bold>Model 2<sup>b</sup></bold></td>
            </tr>
            <tr valign="top">
              <td><break/></td>
              <td>Gini index</td>
              <td>−0.12</td>
              <td>3.78</td>
              <td>&lt;.001</td>
            </tr>
            <tr valign="top">
              <td><break/></td>
              <td>Education</td>
              <td>2.95</td>
              <td>.01</td>
              <td>&lt;.001</td>
            </tr>
            <tr valign="top">
              <td><break/></td>
              <td>Sentiment of physical activity–related tweets (positive/negative ratio)</td>
              <td>−0.01</td>
              <td>.37</td>
              <td>.56</td>
            </tr>
            <tr valign="top">
              <td colspan="5"><bold>Model 3<sup>c</sup></bold></td>
            </tr>
            <tr valign="top">
              <td><break/></td>
              <td>Gini index</td>
              <td>−0.12</td>
              <td>3.79</td>
              <td>&lt;.001</td>
            </tr>
            <tr valign="top">
              <td><break/></td>
              <td>Education</td>
              <td>0.30</td>
              <td>0.01</td>
              <td>&lt;.001</td>
            </tr>
            <tr valign="top">
              <td><break/></td>
              <td>Percent of physical activity–related tweets</td>
              <td>0.05</td>
              <td>.37</td>
              <td>.02</td>
            </tr>
            <tr valign="top">
              <td><break/></td>
              <td>Sentiment of physical activity–related tweets (positive/negative ratio)</td>
              <td>−0.01</td>
              <td>.24</td>
              <td>.53</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table2fn1">
            <p><sup>a</sup><italic>F</italic><sub>3,3137</sub>=116.30; <italic>P</italic>&lt;.001; <italic>R</italic><sup>2</sup>=.11.</p>
          </fn>
          <fn id="table2fn2">
            <p><sup>b</sup><italic>F</italic><sub>3,1704</sub>=55.99; <italic>P</italic>&lt;.001; <italic>R</italic><sup>2</sup>=.09.</p>
          </fn>
          <fn id="table2fn3">
            <p><sup>c</sup><italic>F</italic><sub>3,1704</sub>=43.517; <italic>P</italic>&lt;.001; <italic>R</italic><sup>2</sup>=.09.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
      <table-wrap position="float" id="table3">
        <label>Table 3</label>
        <caption>
          <p>Regression analysis for physical activity–related tweets and age-adjusted county-level physical activity level.</p>
        </caption>
        <table width="1000" cellpadding="7" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="30"/>
          <col width="670"/>
          <col width="100"/>
          <col width="100"/>
          <col width="100"/>
          <thead>
            <tr valign="top">
              <td colspan="2">Variables</td>
              <td>beta</td>
              <td>SE</td>
              <td><italic>P</italic> value</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td colspan="5"><bold>Model 1<sup>a</sup></bold></td>
            </tr>
            <tr valign="top">
              <td><break/></td>
              <td>Gini index</td>
              <td>−0.18</td>
              <td>2.44</td>
              <td>&lt;.001</td>
            </tr>
            <tr valign="top">
              <td><break/></td>
              <td>Education</td>
              <td>0.23</td>
              <td>.01</td>
              <td>&lt;.001</td>
            </tr>
            <tr valign="top">
              <td><break/></td>
              <td>Percent of physical activity–related tweets</td>
              <td>0.10</td>
              <td>0.20</td>
              <td>&lt;.001</td>
            </tr>
            <tr valign="top">
              <td colspan="5"><bold>Model 2<sup>b</sup></bold></td>
            </tr>
            <tr valign="top">
              <td><break/></td>
              <td>Gini index</td>
              <td>−0.13</td>
              <td>3.63</td>
              <td>&lt;.001</td>
            </tr>
            <tr valign="top">
              <td><break/></td>
              <td>Education</td>
              <td>0.25</td>
              <td>.01</td>
              <td>&lt;.001</td>
            </tr>
            <tr valign="top">
              <td><break/></td>
              <td>Sentiment of physical activity–related tweets (positive/negative ratio)</td>
              <td>−0.02</td>
              <td>.35</td>
              <td>.44</td>
            </tr>
            <tr valign="top">
              <td colspan="5"><bold>Model 3<sup>c</sup></bold></td>
            </tr>
            <tr valign="top">
              <td><break/></td>
              <td>Gini index</td>
              <td>−0.13</td>
              <td>3.64</td>
              <td>&lt;.001</td>
            </tr>
            <tr valign="top">
              <td><break/></td>
              <td>Education</td>
              <td>0.26</td>
              <td>.01</td>
              <td>&lt;.001</td>
            </tr>
            <tr valign="top">
              <td><break/></td>
              <td>Percent of physical activity–related tweets</td>
              <td>0.05</td>
              <td>.23</td>
              <td>.03</td>
            </tr>
            <tr valign="top">
              <td><break/></td>
              <td>Sentiment of physical activity–related tweets (positive/negative ratio)</td>
              <td>−0.02</td>
              <td>.35</td>
              <td>.41</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table3fn1">
            <p><sup>a</sup><italic>F</italic><sub>3,3137</sub>=102.93; <italic>P</italic>&lt;.001; <italic>R</italic><sup>2</sup>=.10.</p>
          </fn>
          <fn id="table3fn2">
            <p><sup>b</sup><italic>F</italic><sub>3,1704</sub>=43.09; <italic>P</italic>&lt;.001; <italic>R</italic><sup>2</sup>=.07.</p>
          </fn>
          <fn id="table3fn3">
            <p><sup>c</sup><italic>F</italic><sub>3,1704</sub>=33.52; <italic>P</italic>&lt;.001; <italic>R</italic><sup>2</sup>=.07.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>This study evaluated the feasibility of using Twitter data to monitor physical activity levels by assessing whether geotagged conversations about physical activity behaviors can be extracted from Twitter and whether physical activity–related tweets could be used to monitor physical activity levels. Results suggest that it is feasible to extract physical activity–related geotagged conversations from Twitter. Furthermore, the results suggest that there was a significant association between physical activity–related tweets and physical activity levels while accounting for the Gini index of income inequality, population, and education on a county level across the United States. However, the overall association between physical activity–related tweets and physical activity levels on a county level was weak.</p>
      </sec>
      <sec>
        <title>Research Implications</title>
        <p>Exploring the relationship between physical activity–related tweets and physical activity levels on a county level has several important research implications. First, these findings support the continued research in using nontraditional data sources, such as social media data, to monitor physical activity–related behaviors. Second, our results demonstrated a potential application for using social media data as a complementary tool to aid in both historical and real-time tracking of population-level physical activity. A strength of this study is controlling for related demographic factors such as income inequality and education in various geographic locations in our model. Finally, physical activity researchers can build upon the methods used in this study to find new methods of using social media data to monitor physical activity outcomes. Physical activity researchers can leverage these social media analysis techniques to build models that can predict physical activity levels in real-time. The analysis methods used in this study could in the future aid public health agencies in identifying particular physical activity–related trends or geographical areas of concern on which to focus their health and wellness initiatives.</p>
        <p>Findings from this study validate and extend previously published work that the content of the tweets can be potentially used to monitor and predict behavior and health outcomes [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref22">22</xref>]. It is worth noting that even though we did not show a significant association between the sentiment of physical activity–related tweets and age-adjusted physical activity on a county level, previous studies have shown that the sentiment of the tweets can be used to predict health outcomes. Specifically, a previous study reported that positive sentiment tweets were moderately correlated with lower obesity rates in 190 US MSAs [<xref ref-type="bibr" rid="ref28">28</xref>]. These findings suggest that sentiment analysis may not be an appropriate estimator of physical activity level on a county level but may still be an appropriate estimator in other health-related outcomes on an MSA level.</p>
        <p>Although infoveillance or infodemiology studies such as this are important to epidemiology to avoid <italic>ecological fallacies</italic> [<xref ref-type="bibr" rid="ref19">19</xref>], it is critical for future research to examine the relationship between social media data and physical activity level on an individual level. Studying the prevalence of physical activity is a complex and nuanced topic, one that may be strongly influenced by an individual’s surrounding environment. We were able to obtain improved model performance through the inclusion of per county Gini index data on income inequality and education level. However, future studies will need to investigate whether other known metrics or indicators (eg, the built environment) can be incorporated into Twitter data to create models with improved accuracy in predicting physical activity.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>There are several limitations in the study. There was a lag time and time frame disparity between the Twitter data and physical activity data. The most recent county-level physical activity data, collected as part of its annual BRFSS surveys, was from 2014. In addition, there exist inherent biases that must be noted for any sampling of geotagged Twitter data. Studies on demographics on the platform have found a skew toward a younger, wealthier demographic in general [<xref ref-type="bibr" rid="ref21">21</xref>], as well as increased representation from minority groups and urban populations when looking at geotagged tweets in particular [<xref ref-type="bibr" rid="ref30">30</xref>]. This means that the observed relationship between physical activity–related tweets and physical activity needs to be interpreted with caution as certain demographic or regional groups may be predisposed toward a certain physical activity level. Nevertheless, this study was a feasibility study primarily designed to evaluate whether social media conversations that suggest physical activity–related behaviors could be extracted and used to monitor physical activity at a population level. Second, we only used one source of social media data (Twitter), thus limiting the generalizability of our findings. Using Twitter API’s <italic>garden hose</italic> approach with geographic filtering also limits data collection to less than a 1% random sample of all tweets posted in any given time frame. Future studies will need to explore whether model accuracy can be improved using multiple data sources (eg, Twitter, Facebook, and Instagram) to exploit user overlap between certain social media platforms as well as over a longer data collection period. Finally, studies of this nature rely heavily on the accuracy of the classifier for labeling physical activity–related tweets and conducting sentiment analysis. In particular, the finer-grained filtering offered by sentiment analysis did not appear to offer a notable improvement in fit or classification accuracy. It should be noted that this failure of complex or synthesized features to improve model quality has been observed earlier [<xref ref-type="bibr" rid="ref28">28</xref>]. Subsequent studies may supplant our list-of-hashtags classifier with machine-learning classification approaches to potentially discover keywords, text structure, or other features that may be used to boost both precision and recall, as well as attempt using state-of-the-art sentiment analysis techniques to construct and train custom classifiers that are a better fit for this specific subset of Twitter data.</p>
        <p>Moving forward, there are still other possible features to extract from Twitter data that may be tested for association with levels of physical activity. Although this study focused exclusively on filtering Twitter data by keywords and conducting sentiment analysis, there may be other natural language processing techniques that could be applied to the dataset [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref36">36</xref>]. Future research could investigate training predictive models on a larger, longitudinal dataset of both tweets and physical activity data. If successful, such models could be leveraged to effectively predict levels of physical activity and inactivity using social media data.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>This study evaluated the feasibility of using social media data to monitor physical activity levels on a county-by-county basis. Results from this study suggest that it is feasible to identify geotagged physical activity–related conversations from Twitter data and link them to population-based physical activity outcome data for analyses. We found that the conversation from tweets was weakly associated with county-level physical activity levels in the United States. Future research can build on the methods used in this study to further refine the models that use real-time social media data to monitor physical activity levels.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <app id="app1">
        <title>Multimedia Appendix 1</title>
        <p>Hashtags used to identify tweets related to physical activity.</p>
        <media xlink:href="jmir_v21i6e12394_app1.docx" xlink:title="DOCX File, 14KB"/>
      </app>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">ACSM</term>
          <def>
            <p>American College of Sports Medicine</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">API</term>
          <def>
            <p>application programming interface</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">BRFSS</term>
          <def>
            <p>Behavioral Risk Factor Surveillance System</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">MSA</term>
          <def>
            <p>Metropolitan Statistical Area</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">SemEval</term>
          <def>
            <p>Semantic Evaluation</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This work is supported by the Internal Research Creative Project Grant at the University of Victoria.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Warburton</surname>
            <given-names>DE</given-names>
          </name>
          <name name-style="western">
            <surname>Nicol</surname>
            <given-names>CW</given-names>
          </name>
          <name name-style="western">
            <surname>Bredin</surname>
            <given-names>SS</given-names>
          </name>
        </person-group>
        <article-title>Health benefits of physical activity: the evidence</article-title>
        <source>CMAJ</source>  
        <year>2006</year>  
        <month>03</month>  
        <day>14</day>  
        <volume>174</volume>  
        <issue>6</issue>  
        <fpage>801</fpage>  
        <lpage>9</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.cmaj.ca/cgi/pmidlookup?view=long&amp;pmid=16534088"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1503/cmaj.051351</pub-id>
        <pub-id pub-id-type="medline">16534088</pub-id>
        <pub-id pub-id-type="pii">174/6/801</pub-id>
        <pub-id pub-id-type="pmcid">PMC1402378</pub-id></nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Goodman</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Nolan</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Lacombe</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Thomas</surname>
            <given-names>SG</given-names>
          </name>
        </person-group>
        <article-title>Blood pressure responses to acute and chronic exercise are related in prehypertension</article-title>
        <source>Med Sci Sports Exerc</source>  
        <year>2012</year>  
        <month>09</month>  
        <volume>44</volume>  
        <issue>9</issue>  
        <fpage>1644</fpage>  
        <lpage>52</lpage>  
        <pub-id pub-id-type="doi">10.1249/MSS.0b013e31825408fb</pub-id>
        <pub-id pub-id-type="medline">22899388</pub-id>
        <pub-id pub-id-type="pii">00005768-201209000-00004</pub-id></nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Lacombe</surname>
            <given-names>SP</given-names>
          </name>
          <name name-style="western">
            <surname>Goodman</surname>
            <given-names>JM</given-names>
          </name>
          <name name-style="western">
            <surname>Spragg</surname>
            <given-names>CM</given-names>
          </name>
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Thomas</surname>
            <given-names>SG</given-names>
          </name>
        </person-group>
        <article-title>Interval and continuous exercise elicit equivalent postexercise hypotension in prehypertensive men, despite differences in regulation</article-title>
        <source>Appl Physiol Nutr Metab</source>  
        <year>2011</year>  
        <month>12</month>  
        <volume>36</volume>  
        <issue>6</issue>  
        <fpage>881</fpage>  
        <lpage>91</lpage>  
        <pub-id pub-id-type="doi">10.1139/h11-113</pub-id>
        <pub-id pub-id-type="medline">22070641</pub-id></nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Umpierre</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Ribeiro</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Kramer</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Leitão</surname>
            <given-names>Cristiane B</given-names>
          </name>
          <name name-style="western">
            <surname>Zucatti</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Azevedo</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Gross</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Ribeiro</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Schaan</surname>
            <given-names>B</given-names>
          </name>
        </person-group>
        <article-title>Physical activity advice only or structured exercise training and association with HbA1c levels in type 2 diabetes: a systematic review and meta-analysis</article-title>
        <source>J Am Med Assoc</source>  
        <year>2011</year>  
        <month>05</month>  
        <day>4</day>  
        <volume>305</volume>  
        <issue>17</issue>  
        <fpage>1790</fpage>  
        <lpage>9</lpage>  
        <pub-id pub-id-type="doi">10.1001/jama.2011.576</pub-id>
        <pub-id pub-id-type="medline">21540423</pub-id>
        <pub-id pub-id-type="pii">305/17/1790</pub-id></nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Friedenreich</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Orenstein</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Physical activity and cancer prevention: etiologic evidence and biological mechanisms</article-title>
        <source>J Nutr</source>  
        <year>2002</year>  
        <month>12</month>  
        <volume>132</volume>  
        <issue>11 Suppl</issue>  
        <fpage>3456S</fpage>  
        <lpage>4S</lpage>  
        <pub-id pub-id-type="doi">10.1093/jn/132.11.3456S</pub-id>
        <pub-id pub-id-type="medline">12421870</pub-id></nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="book">
        <source>PAGA. Physical Activity Guidelines Advisory Committee Report</source>  
        <year>2008</year>  
        <publisher-loc>Washington, DC</publisher-loc>
        <publisher-name>US Department of Health and Human Services</publisher-name></nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="web">
        <source>Centers for Disease Control and Prevention</source>  
        <access-date>2019-05-15</access-date>
        <comment>Facts about Physical Activity 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cdc.gov/physicalactivity/data/facts.htm">https://www.cdc.gov/physicalactivity/data/facts.htm</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="78ONZdpa5"/></comment> </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Caspersen</surname>
            <given-names>CJ</given-names>
          </name>
          <name name-style="western">
            <surname>Pereira</surname>
            <given-names>MA</given-names>
          </name>
          <name name-style="western">
            <surname>Curran</surname>
            <given-names>KM</given-names>
          </name>
        </person-group>
        <article-title>Changes in physical activity patterns in the United States, by sex and cross-sectional age</article-title>
        <source>Med Sci Sports Exerc</source>  
        <year>2000</year>  
        <month>09</month>  
        <volume>32</volume>  
        <issue>9</issue>  
        <fpage>1601</fpage>  
        <lpage>9</lpage>  
        <pub-id pub-id-type="medline">10994912</pub-id></nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Trost</surname>
            <given-names>SG</given-names>
          </name>
          <name name-style="western">
            <surname>Owen</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Bauman</surname>
            <given-names>AE</given-names>
          </name>
          <name name-style="western">
            <surname>Sallis</surname>
            <given-names>JF</given-names>
          </name>
          <name name-style="western">
            <surname>Brown</surname>
            <given-names>W</given-names>
          </name>
        </person-group>
        <article-title>Correlates of adults' participation in physical activity: review and update</article-title>
        <source>Med Sci Sports Exerc</source>  
        <year>2002</year>  
        <month>12</month>  
        <volume>34</volume>  
        <issue>12</issue>  
        <fpage>1996</fpage>  
        <lpage>2001</lpage>  
        <pub-id pub-id-type="doi">10.1249/01.MSS.0000038974.76900.92</pub-id>
        <pub-id pub-id-type="medline">12471307</pub-id></nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Young</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <article-title>A survey of social media data analysis for physical activity surveillance</article-title>
        <source>J Forensic Leg Med</source>  
        <year>2018</year>  
        <month>07</month>  
        <volume>57</volume>  
        <fpage>33</fpage>  
        <lpage>36</lpage>  
        <pub-id pub-id-type="doi">10.1016/j.jflm.2016.10.019</pub-id>
        <pub-id pub-id-type="medline">29801949</pub-id>
        <pub-id pub-id-type="pii">S1752-928X(16)30141-X</pub-id>
        <pub-id pub-id-type="pmcid">PMC6276785</pub-id></nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Dunford</surname>
            <given-names>SD</given-names>
          </name>
          <name name-style="western">
            <surname>Leung</surname>
            <given-names>YW</given-names>
          </name>
          <name name-style="western">
            <surname>Brooks</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Thomas</surname>
            <given-names>SG</given-names>
          </name>
          <name name-style="western">
            <surname>Eysenbach</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Nolan</surname>
            <given-names>RP</given-names>
          </name>
        </person-group>
        <article-title>Reducing blood pressure with internet-based interventions: a meta-analysis</article-title>
        <source>Can J Cardiol</source>  
        <year>2013</year>  
        <month>05</month>  
        <volume>29</volume>  
        <issue>5</issue>  
        <fpage>613</fpage>  
        <lpage>21</lpage>  
        <pub-id pub-id-type="doi">10.1016/j.cjca.2013.02.007</pub-id>
        <pub-id pub-id-type="medline">23618507</pub-id>
        <pub-id pub-id-type="pii">S0828-282X(13)00075-5</pub-id></nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Brooks</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Thomas</surname>
            <given-names>SG</given-names>
          </name>
          <name name-style="western">
            <surname>Eysenbach</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Nolan</surname>
            <given-names>RP</given-names>
          </name>
        </person-group>
        <article-title>Effectiveness of user-and expert-driven web-based hypertension programs: an RCT</article-title>
        <source>Am J Prev Med</source>  
        <year>2018</year>  
        <month>12</month>  
        <volume>54</volume>  
        <issue>4</issue>  
        <fpage>576</fpage>  
        <lpage>83</lpage>  
        <pub-id pub-id-type="doi">10.1016/j.amepre.2018.01.009</pub-id>
        <pub-id pub-id-type="medline">29456025</pub-id>
        <pub-id pub-id-type="pii">S0749-3797(18)30015-1</pub-id></nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Hodgson</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Zbib</surname>
            <given-names>AM</given-names>
          </name>
          <name name-style="western">
            <surname>Payne</surname>
            <given-names>AY</given-names>
          </name>
          <name name-style="western">
            <surname>Nolan</surname>
            <given-names>RP</given-names>
          </name>
        </person-group>
        <article-title>The effectiveness of loyalty rewards to promote the use of an Internet-based heart health program</article-title>
        <source>J Med Internet Res</source>  
        <year>2014</year>  
        <month>07</month>  
        <volume>16</volume>  
        <issue>7</issue>  
        <fpage>e163</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.jmir.org/2014/7/e163/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/jmir.3458</pub-id>
        <pub-id pub-id-type="medline">24989982</pub-id>
        <pub-id pub-id-type="pii">v16i7e163</pub-id>
        <pub-id pub-id-type="pmcid">PMC4115265</pub-id></nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Nolan</surname>
            <given-names>RP</given-names>
          </name>
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Shoemaker</surname>
            <given-names>JK</given-names>
          </name>
          <name name-style="western">
            <surname>Hachinski</surname>
            <given-names>V</given-names>
          </name>
          <name name-style="western">
            <surname>Lynn</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Mikulis</surname>
            <given-names>DJ</given-names>
          </name>
          <name name-style="western">
            <surname>Wennberg</surname>
            <given-names>RA</given-names>
          </name>
          <name name-style="western">
            <surname>Moy</surname>
            <given-names>LM</given-names>
          </name>
          <name name-style="western">
            <surname>Zbib</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>Therapeutic benefit of internet-based lifestyle counselling for hypertension</article-title>
        <source>Can J Cardiol</source>  
        <year>2012</year>  
        <month>05</month>  
        <volume>28</volume>  
        <issue>3</issue>  
        <fpage>390</fpage>  
        <lpage>6</lpage>  
        <pub-id pub-id-type="doi">10.1016/j.cjca.2012.02.012</pub-id>
        <pub-id pub-id-type="medline">22498181</pub-id>
        <pub-id pub-id-type="pii">S0828-282X(12)00106-7</pub-id></nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Valle</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Tate</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Mayer</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Allicock</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Cai</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>A randomized trial of a Facebook-based physical activity intervention for young adult cancer survivors</article-title>
        <source>J Cancer Surviv</source>  
        <year>2013</year>  
        <month>09</month>  
        <volume>7</volume>  
        <issue>3</issue>  
        <fpage>355</fpage>  
        <lpage>68</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/23532799"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1007/s11764-013-0279-5</pub-id>
        <pub-id pub-id-type="medline">23532799</pub-id>
        <pub-id pub-id-type="pmcid">PMC3737370</pub-id></nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Salathé</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Digital epidemiology: what is it, and where is it going?</article-title>
        <source>Life Sci Soc Policy</source>  
        <year>2018</year>  
        <month>01</month>  
        <day>4</day>  
        <volume>14</volume>  
        <issue>1</issue>  
        <fpage>1</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29302758"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1186/s40504-017-0065-7</pub-id>
        <pub-id pub-id-type="medline">29302758</pub-id>
        <pub-id pub-id-type="pii">10.1186/s40504-017-0065-7</pub-id>
        <pub-id pub-id-type="pmcid">PMC5754279</pub-id></nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Perrin</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <source>Pew Research Center</source>  
        <year>2015</year>  
        <access-date>2019-05-15</access-date>
        <comment>Social Media Usage 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://www.pewinternet.org/2015/10/08/social-networking-usage-2005-2015/">https://www.pewinternet.org/2015/10/08/social-networking-usage-2005-2015/</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="78ONsKmKK"/></comment> </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Young</surname>
            <given-names>SD</given-names>
          </name>
        </person-group>
        <article-title>Recommended guidelines on using social networking technologies for HIV prevention research</article-title>
        <source>AIDS Behav</source>  
        <year>2012</year>  
        <month>10</month>  
        <volume>16</volume>  
        <issue>7</issue>  
        <fpage>1743</fpage>  
        <lpage>5</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/22821067"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1007/s10461-012-0251-9</pub-id>
        <pub-id pub-id-type="medline">22821067</pub-id>
        <pub-id pub-id-type="pmcid">PMC3459230</pub-id></nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Eysenbach</surname>
            <given-names>G</given-names>
          </name>
        </person-group>
        <article-title>Infodemiology and infoveillance: framework for an emerging set of public health informatics methods to analyze search, communication and publication behavior on the Internet</article-title>
        <source>J Med Internet Res</source>  
        <year>2009</year>  
        <month>03</month>  
        <day>27</day>  
        <volume>11</volume>  
        <issue>1</issue>  
        <fpage>e11</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.jmir.org/2009/1/e11/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/jmir.1157</pub-id>
        <pub-id pub-id-type="medline">19329408</pub-id>
        <pub-id pub-id-type="pii">v11i1e11</pub-id>
        <pub-id pub-id-type="pmcid">PMC2762766</pub-id></nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Eysenbach</surname>
            <given-names>G</given-names>
          </name>
        </person-group>
        <article-title>Infodemiology and infoveillance tracking online health information and cyberbehavior for public health</article-title>
        <source>Am J Prev Med</source>  
        <year>2011</year>  
        <month>05</month>  
        <volume>40</volume>  
        <issue>5 Suppl 2</issue>  
        <fpage>S154</fpage>  
        <lpage>8</lpage>  
        <pub-id pub-id-type="doi">10.1016/j.amepre.2011.02.006</pub-id>
        <pub-id pub-id-type="medline">21521589</pub-id>
        <pub-id pub-id-type="pii">S0749-3797(11)00088-2</pub-id></nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Greenwood</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Perrin</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Duggan</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <source>Pew Research Center</source>  
        <year>2017</year>  
        <access-date>2019-05-15</access-date>
        <comment>Social Media Update 2016 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://www.pewinternet.org/2016/11/11/social-media-update-2016/">https://www.pewinternet.org/2016/11/11/social-media-update-2016/</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="78OO53jLF"/></comment> </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Zhu</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Yu</surname>
            <given-names>DJ</given-names>
          </name>
          <name name-style="western">
            <surname>Rasin</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Young</surname>
            <given-names>SD</given-names>
          </name>
        </person-group>
        <article-title>Using real-time social media technologies to monitor levels of perceived stress and emotional state in college students: a web-based questionnaire study</article-title>
        <source>JMIR Ment Health</source>  
        <year>2017</year>  
        <month>01</month>  
        <day>10</day>  
        <volume>4</volume>  
        <issue>1</issue>  
        <fpage>e2</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://mental.jmir.org/2017/1/e2/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/mental.5626</pub-id>
        <pub-id pub-id-type="medline">28073737</pub-id>
        <pub-id pub-id-type="pii">v4i1e2</pub-id>
        <pub-id pub-id-type="pmcid">PMC5263861</pub-id></nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Zhu</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Young</surname>
            <given-names>SD</given-names>
          </name>
        </person-group>
        <article-title>Monitoring freshman college experience through content analysis of tweets: observational study</article-title>
        <source>JMIR Public Health Surveill</source>  
        <year>2018</year>  
        <month>01</month>  
        <day>11</day>  
        <volume>4</volume>  
        <issue>1</issue>  
        <fpage>e5</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://publichealth.jmir.org/2018/1/e5/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/publichealth.7444</pub-id>
        <pub-id pub-id-type="medline">29326096</pub-id>
        <pub-id pub-id-type="pii">v4i1e5</pub-id>
        <pub-id pub-id-type="pmcid">PMC5785682</pub-id></nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Young</surname>
            <given-names>SD</given-names>
          </name>
          <name name-style="western">
            <surname>Rivers</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Lewis</surname>
            <given-names>B</given-names>
          </name>
        </person-group>
        <article-title>Methods of using real-time social media technologies for detection and remote monitoring of HIV outcomes</article-title>
        <source>Prev Med</source>  
        <year>2014</year>  
        <month>06</month>  
        <volume>63</volume>  
        <fpage>112</fpage>  
        <lpage>5</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24513169"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1016/j.ypmed.2014.01.024</pub-id>
        <pub-id pub-id-type="medline">24513169</pub-id>
        <pub-id pub-id-type="pii">S0091-7435(14)00055-3</pub-id>
        <pub-id pub-id-type="pmcid">PMC4031268</pub-id></nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Bodnar</surname>
            <given-names>TS</given-names>
          </name>
        </person-group>
        <article-title>Validating models for disease detection using twitter</article-title>
        <year>2013</year>  
        <month>05</month>  
        <conf-name>WWW'13 Companion</conf-name>
        <conf-date>May 13-17, 2013</conf-date>
        <conf-loc>Rio de Janeiro, Brazil</conf-loc>
        <fpage>699</fpage>  
        <lpage>702</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://dl.acm.org/citation.cfm?id=2487788.2488027"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Broniatowski</surname>
            <given-names>DA</given-names>
          </name>
          <name name-style="western">
            <surname>Paul</surname>
            <given-names>MJ</given-names>
          </name>
          <name name-style="western">
            <surname>Dredze</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>National and local influenza surveillance through Twitter: an analysis of the 2012-2013 influenza epidemic</article-title>
        <source>PLoS One</source>  
        <year>2013</year>  
        <volume>8</volume>  
        <issue>12</issue>  
        <fpage>e83672</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0083672"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1371/journal.pone.0083672</pub-id>
        <pub-id pub-id-type="medline">24349542</pub-id>
        <pub-id pub-id-type="pii">PONE-D-13-35058</pub-id>
        <pub-id pub-id-type="pmcid">PMC3857320</pub-id></nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Chew</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Eysenbach</surname>
            <given-names>G</given-names>
          </name>
        </person-group>
        <article-title>Pandemics in the age of Twitter: content analysis of Tweets during the 2009 H1N1 outbreak</article-title>
        <source>PLoS One</source>  
        <year>2010</year>  
        <volume>5</volume>  
        <issue>11</issue>  
        <fpage>e14118</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0014118"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1371/journal.pone.0014118</pub-id>
        <pub-id pub-id-type="medline">21124761</pub-id>
        <pub-id pub-id-type="pmcid">PMC2993925</pub-id></nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Gore</surname>
            <given-names>RJ</given-names>
          </name>
          <name name-style="western">
            <surname>Diallo</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Padilla</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>You are what you tweet: connecting the geographic variation in america's obesity rate to Twitter content</article-title>
        <source>PLoS One</source>  
        <year>2015</year>  
        <volume>10</volume>  
        <issue>9</issue>  
        <fpage>e0133505</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0133505"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1371/journal.pone.0133505</pub-id>
        <pub-id pub-id-type="medline">26332588</pub-id>
        <pub-id pub-id-type="pii">PONE-D-15-02269</pub-id>
        <pub-id pub-id-type="pmcid">PMC4557976</pub-id></nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Nguyen</surname>
            <given-names>Q</given-names>
          </name>
          <name name-style="western">
            <surname>Li</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Meng</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Kath</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Nsoesie</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Li</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Wen</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Building a national neighborhood dataset from geotagged Twitter data for indicators of happiness, diet, and physical activity</article-title>
        <source>JMIR Public Health Surveill</source>  
        <year>2016</year>  
        <month>10</month>  
        <day>17</day>  
        <volume>2</volume>  
        <issue>2</issue>  
        <fpage>e158</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://publichealth.jmir.org/2016/2/e158/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/publichealth.5869</pub-id>
        <pub-id pub-id-type="medline">27751984</pub-id>
        <pub-id pub-id-type="pii">v2i2e158</pub-id>
        <pub-id pub-id-type="pmcid">PMC5088343</pub-id></nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Paul</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Dredze</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>You are what you tweet: Analyzing twitter for public health</article-title>
        <year>2011</year>  
        <conf-name>Fifth International AAAI Conference on Weblogs and Social Media</conf-name>
        <conf-date>July 17–21, 2011</conf-date>
        <conf-loc>Barcelona, Catalonia, ES</conf-loc></nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Manley</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <source>Physical Activity And Health: A Report Of The Surgeon General</source>  
        <year>2019</year>  
        <publisher-loc>Darby, PA</publisher-loc>
        <publisher-name>Diane Pub Co</publisher-name></nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Baziotis</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Pelekis</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Doulkeridis</surname>
            <given-names>C</given-names>
          </name>
        </person-group>
        <article-title>DataStories at SemEval-2017 Task 4: Deep LSTM with Attention for Message-level and Topic-based Sentiment Analysis</article-title>
        <year>2017</year>  
        <conf-name>International Workshop on Semantic Evaluation 2011</conf-name>
        <conf-date>August 3-4, 2017</conf-date>
        <conf-loc>Vancouver, Canada</conf-loc>
        <fpage>747</fpage> </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Bethard</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Carpuat</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Cer</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Jurgens</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Nakov</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Zesch</surname>
            <given-names>T</given-names>
          </name>
        </person-group>
        <source>Association for Computational Linguistics</source>  
        <year>2016</year>  
        <access-date>2019-05-17</access-date>
        <comment>Proceedings of the 10th International Workshop on Semantic Evaluation (SemEval-2016) 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://www.aclweb.org/anthology/S16-1000">https://www.aclweb.org/anthology/S16-1000</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="78QcxPpyr"/></comment> </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Rocktäschel</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Grefenstette</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Hermann</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Kočiský</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Blunsom</surname>
            <given-names>P</given-names>
          </name>
        </person-group>
        <source>arXiv</source>  
        <year>2015</year>  
        <access-date>2019-05-17</access-date>
        <comment>Reasoning about entailment with neural attention 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1509.06664">https://arxiv.org/abs/1509.06664</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="78Qd71Did"/></comment> </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Giles-Corti</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Donovan</surname>
            <given-names>RJ</given-names>
          </name>
        </person-group>
        <article-title>Socioeconomic status differences in recreational physical activity levels and real and perceived access to a supportive physical environment</article-title>
        <source>Prev Med</source>  
        <year>2002</year>  
        <month>12</month>  
        <volume>35</volume>  
        <issue>6</issue>  
        <fpage>601</fpage>  
        <lpage>11</lpage>  
        <pub-id pub-id-type="medline">12460528</pub-id>
        <pub-id pub-id-type="pii">S0091743502911151</pub-id></nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Kumar</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <source>Twitter Data Analytics</source>  
        <year>2014</year>  
        <publisher-loc>New York</publisher-loc>
        <publisher-name>Springer</publisher-name></nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
