<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
    <article-id pub-id-type="publisher-id">v19i3e91</article-id>
    <article-id pub-id-type="pmid">28363883</article-id>
    <article-id pub-id-type="doi">10.2196/jmir.7022</article-id>
    <article-categories>
      <subj-group subj-group-type="heading">
        <subject>Original Paper</subject>
      </subj-group>
      <subj-group subj-group-type="article-type">
        <subject>Original Paper</subject>
      </subj-group>
    </article-categories>
    <title-group>
      <article-title>Methods for Coding Tobacco-Related Twitter Data: A Systematic Review</article-title>
    </title-group>
    <contrib-group>
      <contrib contrib-type="editor">
        <name>
          <surname>Keepanasseril</surname>
          <given-names>Arun</given-names>
        </name>
      </contrib>
    </contrib-group>
    <contrib-group>
      <contrib contrib-type="reviewer">
        <name>
          <surname>Conway</surname>
          <given-names>Mike</given-names>
        </name>
      </contrib>
      <contrib contrib-type="reviewer">
        <name>
          <surname>Wen</surname>
          <given-names>Kuang-Yi</given-names>
        </name>
      </contrib>
    </contrib-group>
    <contrib-group>
      <contrib contrib-type="author" id="contrib1" corresp="yes" equal-contrib="yes">
      <name name-style="western">
        <surname>Lienemann</surname>
        <given-names>Brianna A</given-names>
      </name>
      <degrees>PhD</degrees>
      <xref rid="aff1" ref-type="aff">1</xref>
      <address>
        <institution>Department of Preventive Medicine</institution>
        <institution>Keck School of Medicine</institution>
        <institution>University of Southern California</institution>
        <addr-line>2001 N Soto St</addr-line>
        <addr-line>Los Angeles, CA, 90032</addr-line>
        <country>United States</country>
        <phone>1 3109241711</phone>
        <fax>1 3109241711</fax>
        <email>blienema@usc.edu</email>
      </address>  
      <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-7276-1816</ext-link></contrib>
      <contrib contrib-type="author" id="contrib2">
        <name name-style="western">
          <surname>Unger</surname>
          <given-names>Jennifer B</given-names>
        </name>
        <degrees>PhD</degrees>
        <xref rid="aff1" ref-type="aff">1</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-9064-6603</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib3">
        <name name-style="western">
          <surname>Cruz</surname>
          <given-names>Tess Boley</given-names>
        </name>
        <degrees>MPH, PhD</degrees>
        <xref rid="aff1" ref-type="aff">1</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-5894-1802</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib4">
        <name name-style="western">
          <surname>Chu</surname>
          <given-names>Kar-Hai</given-names>
        </name>
        <degrees>PhD</degrees>
        <xref rid="aff1" ref-type="aff">1</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-2486-8846</ext-link>
      </contrib>
    </contrib-group>
    <aff id="aff1">
    <sup>1</sup>
    <institution>Department of Preventive Medicine</institution>
    <institution>Keck School of Medicine</institution>  
    <institution>University of Southern California</institution>  
    <addr-line>Los Angeles, CA</addr-line>
    <country>United States</country></aff>
    <author-notes>
      <corresp>Corresponding Author: Brianna A Lienemann 
      <email>blienema@usc.edu</email></corresp>
    </author-notes>
    <pub-date pub-type="collection"><month>03</month><year>2017</year></pub-date>
    <pub-date pub-type="epub">
      <day>31</day>
      <month>03</month>
      <year>2017</year>
    </pub-date>
    <volume>19</volume>
    <issue>3</issue>
    <elocation-id>e91</elocation-id>
    <!--history from ojs - api-xml-->
    <history>
      <date date-type="received">
        <day>30</day>
        <month>11</month>
        <year>2016</year>
      </date>
      <date date-type="rev-request">
        <day>22</day>
        <month>1</month>
        <year>2017</year>
      </date>
      <date date-type="rev-recd">
        <day>26</day>
        <month>1</month>
        <year>2017</year>
      </date>
      <date date-type="accepted">
        <day>23</day>
        <month>2</month>
        <year>2017</year>
      </date>
    </history>
    <!--(c) the authors - correct author names and publication date here if necessary. Date in form ', dd.mm.yyyy' after jmir.org-->
    <copyright-statement>©Brianna A Lienemann, Jennifer B Unger, Tess Boley Cruz, Kar-Hai Chu. Originally published in the Journal of Medical Internet Research (http://www.jmir.org), 31.03.2017.</copyright-statement>
    <copyright-year>2017</copyright-year>
    <license license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/2.0/">
      <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (http://creativecommons.org/licenses/by/2.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on http://www.jmir.org/, as well as this copyright and license information must be included.</p>
    </license>  
    <self-uri xlink:href="http://www.jmir.org/2017/3/e91/" xlink:type="simple"/>
    <abstract>
      <sec sec-type="background">
        <title>Background</title>
        <p>As Twitter has grown in popularity to 313 million monthly active users, researchers have increasingly been using it as a data source for tobacco-related research.</p>
      </sec>
      <sec sec-type="objective">
        <title>Objective</title>
        <p>The objective of this systematic review was to assess the methodological approaches of categorically coded tobacco Twitter data and make recommendations for future studies.</p>
      </sec>
      <sec sec-type="methods">
        <title>Methods</title>
        <p>Data sources included PsycINFO, Web of Science, PubMed, ABI/INFORM, Communication Source, and Tobacco Regulatory Science. Searches were limited to peer-reviewed journals and conference proceedings in English from January 2006 to July 2016. The initial search identified 274 articles using a Twitter keyword and a tobacco keyword. One coder reviewed all abstracts and identified 27 articles that met the following inclusion criteria: (1) original research, (2) focused on tobacco or a tobacco product, (3) analyzed Twitter data, and (4) coded Twitter data categorically. One coder extracted data collection and coding methods.</p>
      </sec>
      <sec sec-type="results">
        <title>Results</title>
        <p>E-cigarettes were the most common type of Twitter data analyzed, followed by specific tobacco campaigns. The most prevalent data sources were Gnip and Twitter’s Streaming application programming interface (API). The primary methods of coding were hand-coding and machine learning. The studies predominantly coded for relevance, sentiment, theme, user or account, and location of user.</p>
      </sec>
      <sec sec-type="conclusions">
        <title>Conclusions</title>
        <p>Standards for data collection and coding should be developed to be able to more easily compare and replicate tobacco-related Twitter results. Additional recommendations include the following: sample Twitter’s databases multiple times, make a distinction between message attitude and emotional tone for sentiment, code images and URLs, and analyze user profiles. Being relatively novel and widely used among adolescents and black and Hispanic individuals, Twitter could provide a rich source of tobacco surveillance data among vulnerable populations.</p>
      </sec>
    </abstract>
    <kwd-group>
      <kwd>tobacco</kwd>
      <kwd>Internet</kwd>
      <kwd>social marketing</kwd>
      <kwd>review</kwd>
    </kwd-group></article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>As Twitter has grown in popularity to 313 million monthly active users [<xref ref-type="bibr" rid="ref1">1</xref>], researchers have increasingly been using it as a data source for tobacco-related research. Twitter is a microblogging platform where users have 140 characters to share thoughts, jokes, information, images, and URLs (ie, Web addresses). Twitter posts (ie, tweets) are in real time and often public, with the potential to reach a wide audience. Users can retweet or share tweets with others, which can cause tweets to spread to large numbers of users (“go viral”). Posts can be seen when users follow each other or search for specific terms (eg, #vape). Hashtags signify a topic for users to participate in the conversation. Antitobacco campaigns may use a hashtag to start a conversation about the harms of tobacco, for example, the Truth Initiative account, @truthinitiative, promotes the use of #tobaccofreegen in the user description [<xref ref-type="bibr" rid="ref2">2</xref>]. Similarly, the tobacco industry and independent manufacturers can use Twitter to advertise their products. Imperial Brands uses such an approach when it promotes the electronic cigarette (e-cigarette) blu through its account, @blucigs, with the hashtag #JustYouAndblu in the user description and messages to engage with Twitter users [<xref ref-type="bibr" rid="ref3">3</xref>]. Furthermore, social media can be used to counter antitobacco campaigns. When the anti–e-cigarette campaign Still Blowing Smoke [<xref ref-type="bibr" rid="ref4">4</xref>] was released by the State of California on television and Facebook, the pro–e-cigarette campaign Not Blowing Smoke [<xref ref-type="bibr" rid="ref5">5</xref>], developed by pro-vaping groups, countered by taking the Twitter handles @StillBlwngSmoke [<xref ref-type="bibr" rid="ref6">6</xref>] and @NotBlwngSmoke [<xref ref-type="bibr" rid="ref7">7</xref>] to challenge the California campaign’s messages [<xref ref-type="bibr" rid="ref8">8</xref>].</p>
      <p>Tobacco-related tweets can reach a relatively young and ethnically diverse audience. Pew Research Center studies have found that, in the United States, a third of teenagers use Twitter [<xref ref-type="bibr" rid="ref9">9</xref>], while 20% of adults have accounts with the majority being younger than 50 years [<xref ref-type="bibr" rid="ref10">10</xref>]. Twitter is especially popular among girls aged 15 to 17 years with 49% having accounts [<xref ref-type="bibr" rid="ref9">9</xref>]. Similarly, 45% of black, 34% of Hispanic, and 31% of white adolescents use Twitter [<xref ref-type="bibr" rid="ref9">9</xref>]. Comparably, a larger proportion of black (28%) and Hispanic (28%) than white (20%) adult <italic>Internet users</italic> also use Twitter [<xref ref-type="bibr" rid="ref10">10</xref>]. Therefore, tobacco conversations on Twitter, whether pro or anti, may be particularly likely to reach these populations.</p>
      <p>Research utilizing Twitter data is fairly novel without established standards across studies. Thus, it could be advantageous to establish what methods are being used and their strengths and weaknesses. Standards for reporting social media data are needed to be able to compare methods and results across studies [<xref ref-type="bibr" rid="ref11">11</xref>]. This review focuses specifically on the methodology of tobacco-related studies that code Twitter data categorically by examining data collection methods, coding methods, and coding categories. It addresses the questions, “What methodologies are used to categorically code tobacco-related Twitter data” and “What recommendations can be made for future studies?”</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Data Sources</title>
        <p>A literature search was conducted in July 2016 using the databases PsycINFO, Web of Science, PubMed, ABI/INFORM, Communication Source, and the journal Tobacco Regulatory Science. Searches included a Twitter term and a tobacco term: (Twitter OR tweet) AND (tobacco OR nicotine OR...) (<xref ref-type="table" rid="table1">Table 1</xref>). Tobacco terms were selected based on an article on noncigarette tobacco products [<xref ref-type="bibr" rid="ref12">12</xref>] and the US Food and Drug Administration’s (FDA) article, <italic>Recognize Tobacco in Its Many Forms</italic> [<xref ref-type="bibr" rid="ref13">13</xref>]. Searches were limited to peer-reviewed journals in English published from January 2006 to those available in July 2016. The beginning date was selected because Twitter was launched in 2006. The initial search produced 274 nonduplicate articles (<xref ref-type="fig" rid="figure1">Figure 1</xref>).</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Tobacco search terms.</p>
          </caption>
          <table width="707" cellpadding="7" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="106"/>
            <col width="571"/>
            <thead>
              <tr valign="top">
                <td>Search term<sup>a</sup></td>
                <td>Tobacco products covered by search term</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>tobacco</td>
                <td>Tobacco, smokeless tobacco, chewing tobacco, dissolvable tobacco</td>
              </tr>
              <tr valign="top">
                <td>nicotine</td>
                <td>Nicotine, electronic nicotine delivery system</td>
              </tr>
              <tr valign="top">
                <td>cig*</td>
                <td>Cigarette, cigar, little cigar, large cigar, cigarillo, electronic cigarette, e-cigarette, e-cig</td>
              </tr>
              <tr valign="top">
                <td>pipe</td>
                <td>Pipe, waterpipe</td>
              </tr>
              <tr valign="top">
                <td>bidi</td>
                <td>Bidi</td>
              </tr>
              <tr valign="top">
                <td>kretek</td>
                <td>Kretek</td>
              </tr>
              <tr valign="top">
                <td>shisha</td>
                <td>Shisha</td>
              </tr>
              <tr valign="top">
                <td>hookah</td>
                <td>Hookah, e-hookah, hookah pen</td>
              </tr>
              <tr valign="top">
                <td>narghile</td>
                <td>Narghile</td>
              </tr>
              <tr valign="top">
                <td>argileh</td>
                <td>Argileh</td>
              </tr>
              <tr valign="top">
                <td>cheroot</td>
                <td>Cheroot</td>
              </tr>
              <tr valign="top">
                <td>smok*</td>
                <td>Smoke, smokeless tobacco, smoking, smoker</td>
              </tr>
              <tr valign="top">
                <td>chew</td>
                <td>Chew, chewing tobacco</td>
              </tr>
              <tr valign="top">
                <td>snuff</td>
                <td>Snuff, dry snuff, moist snuff</td>
              </tr>
              <tr valign="top">
                <td>snus</td>
                <td>Snus</td>
              </tr>
              <tr valign="top">
                <td>betel quid</td>
                <td>Betel quid</td>
              </tr>
              <tr valign="top">
                <td>gutkha</td>
                <td>Gutkha</td>
              </tr>
              <tr valign="top">
                <td>zarda</td>
                <td>Zarda</td>
              </tr>
              <tr valign="top">
                <td>toombak</td>
                <td>Toombak</td>
              </tr>
              <tr valign="top">
                <td>dissolvable</td>
                <td>Dissolvable, dissolvable tobacco</td>
              </tr>
              <tr valign="top">
                <td>ENDS</td>
                <td>ENDS (electronic nicotine delivery system)</td>
              </tr>
              <tr valign="top">
                <td>vap*</td>
                <td>Vape, vaper, vape pen, vaping, vapor</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>Asterisk (*) represents stemmed words; for example, cig* would capture all words beginning with cig.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>PRISMA (Preferred Reporting Items for Systematic Reviews and Meta-Analyses) diagram of articles included in the systematic review.</p>
          </caption>
          <graphic xlink:href="jmir_v19i3e91_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Study Selection</title>
        <p>One coder independently reviewed all titles and abstracts and selected 43 articles from the initial 274 that referenced any of the tobacco products and Twitter. Full text of the articles was then reviewed. Explicit inclusion criteria were determined a priori to reduce coder bias when selecting articles. Articles were included in the review if they met the following criteria: (1) original research in a peer-reviewed journal, (2) focused on tobacco, (3) analyzed Twitter data, and (4) coded data categorically (eg, sentiment, theme). If an article was excluded for failing to meet multiple inclusion criteria, it was counted in the higher-order criteria for exclusion. A total of 16 articles were excluded, so 27 articles were included in the review (<xref ref-type="fig" rid="figure1">Figure 1</xref>). We excluded 1 article because it was a narrative review rather than original research, 2 articles because they did not address a tobacco product, 1 article because it analyzed Web search results and tobacco control websites rather than Twitter data, and 12 articles because they did not categorically code tobacco-related Twitter data. For example, a study may have tracked changes in the number of tweets over time but not coded the tweets categorically. The 27 included articles ranged from 2011 to 2016. Although there is risk for bias in studies, this review considered all studies that met the inclusion criteria to evaluate the strengths and weakness of all methodological approaches within this domain. The primary focus of this review is the methodology of qualitative studies rather than the outcomes of quantitative studies. Therefore, the risk of publication bias of studies with significant results and selective reporting of significant results is minimal for this type of review compared with a meta-analysis of quantitative outcomes.</p>
      </sec>
      <sec>
        <title>Data Extraction</title>
        <p>One author read each article to extract methodological information on data collection (data sources, date collected, tobacco topics, search keyword selection), coding methods (type of coding method, number of coders, number of tweets coded, coded retweets, number of Twitter accounts, followed URLs, coding agreement), and coded categories. This information is presented in detail in <xref ref-type="table" rid="table2">Tables 2</xref>, <xref ref-type="table" rid="table3">3</xref>, and <xref ref-type="table" rid="table4">4</xref> and is summarized in the results.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Data Collection Methods</title>
        <sec>
          <title>Data Sources</title>
          <p>In total, 22 of the 27 articles discussed the sources they used for their sample of Twitter messages, while 5 articles did not. Twitter provides 3 primary sources of data: Twitter’s Search application programming interface (API), Twitter’s Streaming API, and Twitter’s Firehose. An additional method is Twitter’s REST API, which allows tracking specific users by their username. One study collected data using Twitter’s REST API.</p>
          <p>Twitter’s Search API is free to use and provides a maximum of 3200 past tweets (ie, published in the past 7 days, so it is not in real time) with a limit of 180 searches every 15 minutes [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref15">15</xref>]. Twitter’s Search API was used in 2 studies (<xref ref-type="table" rid="table2">Table 2</xref>). There are programs developed to interact between Twitter’s Search API and specific analyses programs. For example, twitteR package for R [<xref ref-type="bibr" rid="ref16">16</xref>], NCapture for NVivo [<xref ref-type="bibr" rid="ref17">17</xref>], and Social Network Importer for NodeXL, the free add-on for Excel [<xref ref-type="bibr" rid="ref18">18</xref>], provide access to Twitter’s Search API. A small subset of the studies used these programs: twitteR package for R (n=1), NCapture (n=1), and Social Network Importer for NodeXL (n=1).</p>
          <p>More useful to researchers is Twitter’s Streaming API, which provides all tweets related to the search terms up to a limit of 1% of the Twitter database for that time period. If the selected search terms are infrequently used across Twitter (eg, the name of a local tobacco campaign), all tweets related to the search terms will be available. However, if the selected search terms are commonly used, tweets related to those terms will be available up to a limit of 1% of the current Twitter database. Twitter’s Streaming API is free, publicly available data [<xref ref-type="bibr" rid="ref19">19</xref>]. A total of 5 studies used Twitter’s Streaming API (<xref ref-type="table" rid="table2">Table 2</xref>). Twitonomy is an analytics tool that accesses Twitter’s Streaming API and offers both free and premium packages for a small fee [<xref ref-type="bibr" rid="ref20">20</xref>]. One article used Twitonomy.</p>
          <p>Providing the greatest access to data, Twitter’s Firehose has real-time access to 100% of Twitter content. Twitter’s Firehose formerly was handled by multiple data providers (eg, Gnip, DataSift, and Topsy). After the acquisition of Gnip in 2014, Twitter transitioned to only allowing access to Twitter’s Firehose through Gnip for a fee from August 2015 onward [<xref ref-type="bibr" rid="ref21">21</xref>]. A total of 6 articles used Gnip, making it the most common method to collect data (<xref ref-type="table" rid="table2">Table 2</xref>). There are social listening programs that buy Twitter data from data providers such as Gnip. Radian6 [<xref ref-type="bibr" rid="ref22">22</xref>], Simply Measured [<xref ref-type="bibr" rid="ref23">23</xref>], and Sysomos Heartbeat [<xref ref-type="bibr" rid="ref24">24</xref>] collect data from across social networking sites, blogs, forums, and news sites for a fee. A few articles used these social listening programs to collect data: Radian6 (n=2), Simply Measured (n=1), and Sysomos Heartbeat (n=1).</p>
          <table-wrap position="float" id="table2">
            <label>Table 2</label>
            <caption>
              <p>Data collection methods.</p>
            </caption>
            <table width="746" cellpadding="7" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="35"/>
              <col width="70"/>
              <col width="125"/>
              <col width="220"/>
              <col width="60"/>
              <col width="53"/>
              <col width="50"/>
              <thead>
                <tr valign="top">
                  <td>Article</td>
                  <td>Date collected</td>
                  <td>Type of tweets or accounts</td>
                  <td>Keyword selection<sup>a,b</sup></td>
                  <td>Data source</td>
                  <td>Retrieval precision</td>
                  <td>Retrieval recall</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>[<xref ref-type="bibr" rid="ref8">8</xref>]</td>
                  <td>March 22 to June 27, 2015</td>
                  <td>Tweets about the California Department of Public Health “Still Blowing Smoke” <break/>media campaign about the harms of e-cigarettes and the pro–e-cigarette campaign “Not Blowing Smoke”</td>
                  <td>#stillblowingsmoke, stillblowingsmoke, “still <break/>blowing smoke”, stillblngsmoke, “still blng smoke”, #notblowingsmoke, notblowingsmoke, “not blowing smoke”, notblngsmoke, “not blng smoke”, <break/>@CAPublicHealth</td>
                  <td>Gnip</td>
                  <td>97.5%</td>
                  <td>NR<sup>c</sup></td>
                </tr>
                <tr valign="top">
                  <td>[<xref ref-type="bibr" rid="ref25">25</xref>]</td>
                  <td>May 1, 2013, to May 1, 2014</td>
                  <td>E-cigarettes</td>
                  <td>vaping, vape, vaper, vapers, vapin, vaped, evape, vaporing, e-cig*, ecig*, e-pen, epen, e-juice, ejuice, e-liquid, eliquid, cloud chasing, cloudchasing, deeming AND regulation, deeming AND FDA, deemed AND FDA, deem* AND FDA</td>
                  <td>Gnip</td>
                  <td>59.23%</td>
                  <td>NR</td>
                </tr>
                <tr valign="top">
                  <td>[<xref ref-type="bibr" rid="ref26">26</xref>]</td>
                  <td>July 1, 2008, to February 28, 2013</td>
                  <td>E-cigarettes</td>
                  <td><italic>55 keywords (only examples reported)</italic>: <italic>general e-cigarette terms</italic> (<italic>eg,</italic> electronic cigarette, eCig), <break/><italic>specific brand names</italic> (<italic>eg,</italic> blu, NJoy, green smoke), <italic>and terms about e-cigarette use</italic> (<italic>eg</italic>, vaping) <break/><italic>Excluded words related to tobacco or drugs (only examples reported)</italic>: marijuana, hookah</td>
                  <td>Radian6</td>
                  <td>91%</td>
                  <td>93%</td>
                </tr>
                <tr valign="top">
                  <td>[<xref ref-type="bibr" rid="ref27">27</xref>]</td>
                  <td>December 5, 2011, to July 17, 2012 (15-day intervals)</td>
                  <td>Tobacco</td>
                  <td>cig*, nicotine, smok*, tobacco; hookah, shisha, <break/>waterpipe, e-juice, e-liquid, vape <italic>and</italic> vaping</td>
                  <td>Twitter’s <break/>Streaming API<sup>d</sup></td>
                  <td>57.25%</td>
                  <td>95%-99%</td>
                </tr>
                <tr valign="top">
                  <td>[<xref ref-type="bibr" rid="ref28">28</xref>]</td>
                  <td>January 1 to December 31, 2014</td>
                  <td>E-cigarettes and smoking cessation</td>
                  <td><italic>E-cigarette keywords</italic>: vaping, vaper, vapes, vapers, e-cigarette, e-cig, mod, eGo, mod, RBA, RDA, vape, “vape pen”, “e-hookah”, “e-pipe”, “e-shisha”, “hookah pen”, “vape pipe”, #vape #vapelife #vapor #vapeporn #vapenation #vapestars #vaperazzi <break/>#vapingstyle #vaperevolution #vapeswag #vapesirens #vaperscommunity #vapepics #vapesociety <break/>#socialvapers #vapefamily #vapefreedom #vapelove #vapers #vapstagram #vapelyfe #vapeshop #vapeon #vapestrong #girlswhovape #alldayvape #adv #vapersoul #VGOD #ecig #ecigarette <break/><italic>Smoking cessation keywords</italic>: quit, stop, “quit <break/>smoking”, “stop smoking”, “quit cigarettes”, “smoke less”, “smoking less”, help, NRT, patch, lozenge, spray, gum, nicorette, nicotine, #quit #quitsmoking #quitsmokingcigarettes #Cessationnation <break/><italic>Exclusion keywords</italic>: marijuana, weed, pot, dank, trees, green, cheeba, THC, cannabis, sativa, indica, bud, marihuana, MJ, “mary jane”</td>
                  <td>Sysomos <break/>Heartbeat</td>
                  <td>NR</td>
                  <td>NR</td>
                </tr>
                <tr valign="top">
                  <td>[<xref ref-type="bibr" rid="ref29">29</xref>]</td>
                  <td>February 1 to April 30, 2014</td>
                  <td>Blu e-cigarettes’ tweets and retweets</td>
                  <td>@blucigs</td>
                  <td>Twitter REST API</td>
                  <td>NR</td>
                  <td>NR</td>
                </tr>
                <tr valign="top">
                  <td>[<xref ref-type="bibr" rid="ref30">30</xref>]</td>
                  <td>April 12 to May 10, 2014</td>
                  <td>Hookah or shisha</td>
                  <td>hookah, #hookah, shisha, #shisha, hooka, #hooka, sheesha, #sheesha</td>
                  <td>Simply <break/>Measured</td>
                  <td>99.56%</td>
                  <td>NR</td>
                </tr>
                <tr valign="top">
                  <td>[<xref ref-type="bibr" rid="ref31">31</xref>]</td>
                  <td>November 1, 2011, to August 31, 2013</td>
                  <td>Hookah, cigarettes, and cigars</td>
                  <td>cigar, cigars, cigarette, cigarettes, hookah, waterpipe, water pipe, shisha, sheesha</td>
                  <td>Twitter’s <break/>Streaming API</td>
                  <td>NR</td>
                  <td>NR</td>
                </tr>
                <tr valign="top">
                  <td>[<xref ref-type="bibr" rid="ref32">32</xref>]</td>
                  <td>October 4 to November 3, 2010</td>
                  <td>Tobacco</td>
                  <td>Smoking, tobacco, cigarette, cigar, hookah, hooka</td>
                  <td>Twitter’s <break/>Search API</td>
                  <td>NR</td>
                  <td>NR</td>
                </tr>
                <tr valign="top">
                  <td>[<xref ref-type="bibr" rid="ref33">33</xref>]</td>
                  <td>May 1, 2012, to June 30, 2012</td>
                  <td>E-cigarettes</td>
                  <td><italic>Keywords</italic>: e-cigarette, ecigarette, e-cig, ecig <break/><italic>Additional keywords AND “cig” or “cigarette”</italic>: electronic, blu, njoy</td>
                  <td>Gnip</td>
                  <td>&#62;99% of a random sample of 500 tweets</td>
                  <td>NR</td>
                </tr>
                <tr valign="top">
                  <td>[<xref ref-type="bibr" rid="ref34">34</xref>]</td>
                  <td>December 6, 2012, to June 20, 2013</td>
                  <td>Tobacco or cessation price promotion</td>
                  <td><italic>Tobacco-related</italic>: cig(s), cigarette(s), smoking, <break/>tobacco, blu cigarette, njoy cigarette, ecig, e-cig, @blucig, e-cigarette, ecigarette, from:blucigs*, ecigs, e-cigs, ecigarettes, e-cigarettes, “green smoke”, “south beach smoke”, cartomizer, (atomizer OR <break/>atomizers) –perfume*, ehookah OR e-hookah, ejuice OR ejuices OR e-juice OR e-juices, eliquid OR <break/>eliquids OR e-liquid OR e-liquids, e-smoke OR e-smokes, (esmoke OR esmokes), eversmoke, “joye 510”, joye510, lavatube OR lavatubes, logicecig OR logicecigs, smartsmoker, smokestik OR smokestiks, “v2 cig” OR “v2 cigs” OR v2cig OR v2cigs, vaper OR vapers OR vaping, zerocig OR zerocigs, <break/>cartomizers, Vuse, MarkTen <break/><italic>Price-related</italic>: Coupon(s), Promo(s), Promotions(s), Promotional, Discount(s)(ed), Save, Code(s)</td>
                  <td>Gnip</td>
                  <td>56.94%</td>
                  <td>NR</td>
                </tr>
                <tr valign="top">
                  <td>[<xref ref-type="bibr" rid="ref35">35</xref>]</td>
                  <td>July 2014</td>
                  <td>Slogans for the Dutch health campaign “Smoking is so outdated” (Roken kan echt niet meer)</td>
                  <td>#rokenkanechtnietmeer [#smokingissooutdated]</td>
                  <td>Twitter’s <break/>Search API</td>
                  <td>NR</td>
                  <td>NR</td>
                </tr>
                <tr valign="top">
                  <td>[<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                  <td>December 2013</td>
                  <td>Little cigars</td>
                  <td>Swisher Sweets, Black &#38; Milds</td>
                  <td>Twitonomy</td>
                  <td>67.50%</td>
                  <td>NR</td>
                </tr>
                <tr valign="top">
                  <td>[<xref ref-type="bibr" rid="ref37">37</xref>]</td>
                  <td>September 2012 and January to May 2013</td>
                  <td>Genetic information on smoking</td>
                  <td>genetic, smoking</td>
                  <td>NR</td>
                  <td>49.1%</td>
                  <td>NR</td>
                </tr>
                <tr valign="top">
                  <td>[<xref ref-type="bibr" rid="ref38">38</xref>]</td>
                  <td>August 2010</td>
                  <td>Smoking cessation accounts</td>
                  <td><italic>Searched for smoking cessation accounts using the following terms</italic>: “quit or stop smoking” or “smoking cessation”</td>
                  <td>NR</td>
                  <td>NR</td>
                  <td>NR</td>
                </tr>
                <tr valign="top">
                  <td>[<xref ref-type="bibr" rid="ref39">39</xref>]</td>
                  <td>January 8-15, 2014</td>
                  <td>Tweets about Chicago <break/>Department of Public Health’s e-cigarette Twitter campaign</td>
                  <td>@ChiPublicHealth</td>
                  <td>twitteR package for R and NodeXL</td>
                  <td>NR</td>
                  <td>NR</td>
                </tr>
                <tr valign="top">
                  <td>[<xref ref-type="bibr" rid="ref40">40</xref>]</td>
                  <td>January 2010 to January 2015</td>
                  <td>E-cigarettes</td>
                  <td>vape, ecig, ecigarette, vaping, ejuice, vapers, drip AND tip, dripping, eliquid AND flavor, e AND juice, e AND liquid, smoke AND free, off AND cigarettes, ex AND smoker, no AND analogs, I AND quit</td>
                  <td>NR</td>
                  <td>NR</td>
                  <td>NR</td>
                </tr>
                <tr valign="top">
                  <td>[<xref ref-type="bibr" rid="ref41">41</xref>]</td>
                  <td>January 2012 to December 2014</td>
                  <td>E-cigarettes</td>
                  <td>e(-)cig, e(-)cigarette, electronic cigarette, <italic>etc</italic></td>
                  <td>Twitter’s Streaming API</td>
                  <td>81% to 90.8% for 4 groups <break/>of 500 <break/>randomly sampled automated tweets</td>
                  <td>NR</td>
                </tr>
                <tr valign="top">
                  <td>[<xref ref-type="bibr" rid="ref42">42</xref>]</td>
                  <td>September to December 2013 and March 2015</td>
                  <td>E-cigarettes</td>
                  <td>Electronic-cigarette, e-cig, e-cigarette, e-juice, <break/>e-liquid, vape-juice, vape-liquid</td>
                  <td>Twitter’s Streaming API and Twitter’s Firehose</td>
                  <td>97.21%</td>
                  <td>86.63%</td>
                </tr>
                <tr valign="top">
                  <td>[<xref ref-type="bibr" rid="ref43">43</xref>]</td>
                  <td>April 21 to October 20, 2014</td>
                  <td>Blu and V2 e-cigarettes’ tweets and retweets</td>
                  <td>@blucigs, @v2cigs</td>
                  <td>NR</td>
                  <td>100%</td>
                  <td>NR</td>
                </tr>
                <tr valign="top">
                  <td>[<xref ref-type="bibr" rid="ref44">44</xref>]</td>
                  <td>July 7 to 21, 2014</td>
                  <td>Tweets about the Centers for Disease Control and <break/>Prevention’s (CDC) Tips From Former Smokers <break/>campaign</td>
                  <td>#cdctips, CDC AND smoking</td>
                  <td>Social <break/>Network <break/>Importer for NodeXL</td>
                  <td>81.70%</td>
                  <td>NR</td>
                </tr>
                <tr valign="top">
                  <td>[<xref ref-type="bibr" rid="ref45">45</xref>]</td>
                  <td>May 1, 2013, to May 1, 2014</td>
                  <td>E-cigarettes</td>
                  <td>vaping, vape, vaper, vapers, vapin, vaped, evape, vaporing, e-cig*, ecig*, e-pen, epen, e-juice, ejuice, e-liquid, eliquid, cloud chasing, cloudchasing, deeming AND regulation, deeming AND FDA, deemed AND FDA, deem* AND FDA</td>
                  <td>Gnip</td>
                  <td>59.23%</td>
                  <td>NR</td>
                </tr>
                <tr valign="top">
                  <td>[<xref ref-type="bibr" rid="ref46">46</xref>]</td>
                  <td>March to June 2013</td>
                  <td>Tobacco control program tweets during the months that the national CDC Tips smoking cessation campaign aired</td>
                  <td><italic>Google search for tobacco control programs using the terms “</italic> tobacco program <italic>” and “</italic> quitline <italic>.” If the site included a link to a Twitter account, that</italic> <break/><italic>account was included</italic>.</td>
                  <td>Radian6</td>
                  <td>NR</td>
                  <td>NR</td>
                </tr>
                <tr valign="top">
                  <td>[<xref ref-type="bibr" rid="ref47">47</xref>]</td>
                  <td>March 15 to June 9, 2012</td>
                  <td>Tweets about the CDC’s Tips campaign</td>
                  <td><italic>Tobacco behavior</italic>: cig(s), cigarette(s), nicotine, smoke(s), smoker, smoking, tobacco <break/><italic>Tobacco policy</italic>: @cdcgov, @cdctobaccofree, <break/>@drfriedencdc, @fdatobacco, @smokefreegov, <break/>antitobacco, antismoking, CDC, quitline, quitnow, secondhand+smoke, smokefree, smokefree.gov, <break/>tobaccofree <break/><italic>Ad specific</italic>: #cdctips, amputation, amputee, <break/>Buerger’s+Disease, heart+attack, hole+neck, hole+throat, lung+cancer, stoma, stroke, <break/>throat+cancer <break/><italic>Engagement</italic>: ad, commercial, campaign, PSA</td>
                  <td>Gnip</td>
                  <td>78.87%</td>
                  <td>94%</td>
                </tr>
                <tr valign="top">
                  <td>[<xref ref-type="bibr" rid="ref48">48</xref>]</td>
                  <td>February 5-12, 2014</td>
                  <td>CVS Health-related tweets surrounding the <break/>announcement of ending <break/>tobacco sales</td>
                  <td>#cvs, #cvsquits</td>
                  <td>Twitter’s Streaming API</td>
                  <td>72.38%</td>
                  <td>NR</td>
                </tr>
                <tr valign="top">
                  <td>[<xref ref-type="bibr" rid="ref49">49</xref>]</td>
                  <td>50 most recent tweets from July 18, 2012</td>
                  <td>Smoking cessation accounts</td>
                  <td><italic>Searched for smoking cessation accounts using the terms</italic>: “quit smoking” <italic>and</italic> “smoking cessation”</td>
                  <td>NR</td>
                  <td>NR</td>
                  <td>NR</td>
                </tr>
                <tr valign="top">
                  <td>[<xref ref-type="bibr" rid="ref50">50</xref>]</td>
                  <td>February 23 to April 9, 2015</td>
                  <td>Exposure to secondhand e-cigarette aerosol</td>
                  <td>“secondhand vape” OR “secondhand vaping” OR “second-hand vape” OR “second-hand vaping” OR “vape smoke” OR “ecig smoke” OR “e-cig smoke” OR “e-cigarette smoke” OR “vape shs” OR “ecig shs” OR “vape <break/>secondhand smoke” OR “vape second-hand smoke” OR “esmoke” OR “e-smoke”</td>
                  <td>NCapture</td>
                  <td>NR</td>
                  <td>NR</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table2fn1">
                <p><sup>a</sup>Asterisk (*) represents stemmed words; for example, cig* would capture all words beginning with cig.</p>
              </fn>
              <fn id="table2fn2">
                <p><sup>b</sup>Words in italics were not keywords used for searches.</p>
              </fn>
              <fn id="table2fn3">
                <p><sup>c</sup>NR: not reported.</p>
              </fn>
              <fn id="table2fn4">
                <p><sup>d</sup>API: application programming interface.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
        </sec>
        <sec>
          <title>Date Collected</title>
          <p>Twitter data were collected across the studies from 2008 to 2015. The time span of Twitter data collected within an individual study ranged from 1 day to 5 years with a median of 14 weeks (<xref ref-type="table" rid="table2">Table 2</xref>).</p>
        </sec>
        <sec>
          <title>Tobacco Topics</title>
          <p>Among the 27 studies, 41% (n=11) analyzed messages related to e-cigarettes, 19% (n=5) related to other tobacco products, and 22% (n=6) about specific tobacco campaigns (<xref ref-type="table" rid="table2">Table 2</xref>). The remaining topics included smoking cessation accounts (n=2), tobacco or cessation price promotion (n=1), genetic information on smoking (n=1), and ending tobacco sales at CVS Health (n=1).</p>
        </sec>
        <sec>
          <title>Search Keyword Selection</title>
          <p>Kim and colleagues [<xref ref-type="bibr" rid="ref11">11</xref>] proposed a framework of three steps to develop and validate search filters. This framework was selected because it provided a standard in which to compare studies. Most of the articles partially fulfilled these steps within the framework. The first step is to develop a search filter. All the articles generated a list of keywords presumably based on expert knowledge of the topic or a systematic search of language related to the topic of interest. However, only 4 articles discussed the process of discarding keywords that returned a high proportion of irrelevant results and adding new keywords as new terms appeared in the returned literature [<xref ref-type="bibr" rid="ref25">25</xref>-<xref ref-type="bibr" rid="ref28">28</xref>]. It should be noted that for some studies this process of developing a search filter may be irrelevant because they are coding all tweets from a specific account (eg, coding tweets from the blu e-cigarette account, @blucigs) [<xref ref-type="bibr" rid="ref29">29</xref>].</p>
          <p>Search keyword selection was tailored to the studies’ specific topics (<xref ref-type="table" rid="table2">Table 2</xref>). To search for e-cigarette Twitter data, variations on e-cigarette (eg, e-cig), vape (eg, vaping), e-liquid (eg, eliquid), and e-juice (eg, ejuice) were common. Some e-cigarette studies also included major e-cigarette companies or brands as key search terms (eg, Njoy). Studies that analyzed Twitter data on specific tobacco campaigns used a variety of tactics such as searching for variations on the campaign name (eg, still blowing smoke), the source of the campaign (eg, CDC), specific features of the campaign ads (eg, lung+cancer), tobacco products and behavior (eg, smoke), and general campaign terms (eg, PSA). Some studies also used a combination of searching for terms with and without hashtags (eg, hookah, #hookah). In 2 studies, marijuana terms (eg, weed) were used as exclusion keywords [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref28">28</xref>].</p>
          <p>The second step of the framework is to apply the search filter and split data into retrieved and unretrieved sets. The third step is to assess the search filter on its ability to distinguish between relevant and irrelevant messages [<xref ref-type="bibr" rid="ref11">11</xref>]. Precision refers to how much retrieved data are relevant, whereas recall refers to how much relevant data are retrieved. Recall is similar to measures of sensitivity. Precision is much less difficult to accurately estimate than recall because recall requires conclusions to be drawn about the tweets that were not retrieved. A precision score of 100% means that all retrieved data were relevant, while a recall score of 100% means that all relevant data were retrieved. However, precision and recall are inversely related. As a search filter expands to collect more data, the proportion of relevant data decreases. Publications can present a precision-recall curve to show the extent of this trade-off for their search filter. A good search filter will maintain a relatively high level of precision as recall increases. A total of 15 articles reported precision, which ranged from 49.1% to 100% (<xref ref-type="table" rid="table2">Table 2</xref>). A total of 4 articles reported recall, which ranged from 86.6% to 99% (<xref ref-type="table" rid="table2">Table 2</xref>).</p>
        </sec>
      </sec>
      <sec>
        <title>Coding Methods</title>
        <p>Coding methods for the studies included hand-coding, machine learning, or a combination of the two. Hand-coding involves one or more human coders categorizing data. When 2 or more coders independently code data, a coding agreement score (eg, kappa) between the coders can be calculated. In contrast, machine learning uses an algorithm for a computer to learn how to code data. However, human-coding is used for an initial subset of data to help refine the algorithm to improve its accuracy. Coding categories may be determined a priori based on prior research or they may be developed inductively through the process of coding. Studies used hand-coding only (n=17), machine learning + hand-coding (n=8), and machine learning only (n=2; <xref ref-type="table" rid="table3">Table 3</xref>). Of the studies using hand-coding, data were coded by the reviewed studies’ researchers in 16 studies, while 1 study used crowdsourcing (ie, many Web workers) [<xref ref-type="bibr" rid="ref30">30</xref>]. All the studies that used machine learning also used initial hand-coding for a subset of the data, except for 2 studies that used topic modeling [<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref32">32</xref>]. Topic modeling produces thematically related word clusters from the text [<xref ref-type="bibr" rid="ref31">31</xref>].</p>
        <p>The data collected in the hand-coded studies ranged from a collection period of 1 day to 1 year, while the machine learning studies ranged from 1 month to 5 years of Twitter data. Across the articles that used hand-coding, the number of coders per tweet ranged from 1 to 6. Coding agreement was reported by 20 articles: coding agreement percentage (n=5; 72% to 95.7%), kappa scores (n=13; kappa=.64 to 1.00), Cronbach alpha (n=1; alpha=.61 to 1.00), and both coding agreement percentage and kappa scores (n=1). Kappa values can be interpreted as poor (&#60;.20), fair (.21-.40), moderate (.41-.60), good (.61-.80), and very good (.81-1.00) [<xref ref-type="bibr" rid="ref51">51</xref>]. Cronbach alpha can be interpreted as unacceptable (&#60;.50), poor (.50-.59), questionable (.60-.69), acceptable (.70-.79), good, (.80-.89), and excellent (&#62;.90) [<xref ref-type="bibr" rid="ref52">52</xref>]. However, it is important to note that these thresholds are not derived statistically but instead rely on intuitive judgments. The number of tweets coded per study ranged from 171 to 17,098 for hand-coding and from 7362 to 1,669,123 for machine learning. A total of 14 articles included retweets in their total number of tweets. A total of 15 articles reported the number of unique Twitter accounts, which ranged from 2 to 3804 for hand-coding studies and from 23,700 to 166,857 for machine learning studies (see <xref ref-type="table" rid="table3">Table 3</xref>).</p>
        <p>URLs in tweets can provide information that changes the context or meaning of a tweet. Following URLs to their respective webpages can be time-consuming, but it can increase coding accuracy. Machine learning algorithms can analyze the text within URLs but may require human coders to follow them to their respective webpages. A total of 15 articles reported whether they followed URLs (followed: n=10, did not follow: n=5; <xref ref-type="table" rid="table3">Table 3</xref>). One article provided the most common URLs [<xref ref-type="bibr" rid="ref26">26</xref>]. The studies tended to show that advertising or commercial tweets were significantly more likely to contain URLs than other types of tweets [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref34">34</xref>].</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Coding methods.</p>
          </caption>
          <table width="752" cellpadding="7" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="35"/>
            <col width="70"/>
            <col width="90"/>
            <col width="80"/>
            <col width="70"/>
            <col width="65"/>
            <col width="70"/>
            <col width="50"/>
            <thead>
              <tr valign="top">
                <td>Article</td>
                <td>Coding method</td>
                <td>No. of coders</td>
                <td>No. of tweets coded</td>
                <td>Coded retweets</td>
                <td>No. of Twitter accounts</td>
                <td>Followed URLs</td>
                <td>Coding <break/>agreement</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>[<xref ref-type="bibr" rid="ref8">8</xref>]</td>
                <td>Hand-coded by researchers</td>
                <td>1: all tweets; <break/>2: subsample 300 tweets</td>
                <td>2248: relevance; <break/>2192: content</td>
                <td>Yes</td>
                <td>NR<sup>a</sup></td>
                <td>No</td>
                <td>91%: <break/>sentiment; <break/>72%: theme</td>
              </tr>
              <tr valign="top">
                <td>[<xref ref-type="bibr" rid="ref25">25</xref>]</td>
                <td>Hand-coded by researchers</td>
                <td>6: for a subset of 250 tweets; <break/>NR for total</td>
                <td>17,098: relevance; <break/>10,128: content</td>
                <td>Yes, if additional context</td>
                <td>NR</td>
                <td>Yes</td>
                <td>κ=.64 to .70</td>
              </tr>
              <tr valign="top">
                <td>[<xref ref-type="bibr" rid="ref26">26</xref>]</td>
                <td>Machine learning with initial hand-coding; Python Scikit-Learn</td>
                <td>NR</td>
                <td>1,669,123</td>
                <td>Yes</td>
                <td>NR</td>
                <td>Yes</td>
                <td>NR</td>
              </tr>
              <tr valign="top">
                <td>[<xref ref-type="bibr" rid="ref27">27</xref>]</td>
                <td>Machine learning and hand-coding; naïve Bayes, <break/>k-nearest <break/>neighbors, and support vector machines</td>
                <td>2: pilot of 1000; <break/>2: random subset of 150; <break/>2: all 7362</td>
                <td>7362: relevance; <break/>4215: content</td>
                <td>Retweeted posts were only<break/>included once</td>
                <td>NR</td>
                <td>NR</td>
                <td>κ&#62;.70 for the random subset of 150</td>
              </tr>
              <tr valign="top">
                <td>[<xref ref-type="bibr" rid="ref28">28</xref>]</td>
                <td>Hand-coded by researchers</td>
                <td>1: all tweets; <break/>2: for 10% subsample</td>
                <td>300: complete sample; <break/>300: industry-free sample; <break/>481 of 600: content (duplicates between samples removed)</td>
                <td>Yes</td>
                <td>148: complete sample; <break/>215: industry-free sample</td>
                <td>Yes</td>
                <td>κ=.74</td>
              </tr>
              <tr valign="top">
                <td>[<xref ref-type="bibr" rid="ref29">29</xref>]</td>
                <td>Hand-coded by researchers</td>
                <td>2</td>
                <td>NR</td>
                <td>Yes</td>
                <td>Approximately 3400</td>
                <td>NR</td>
                <td>NR</td>
              </tr>
              <tr valign="top">
                <td>[<xref ref-type="bibr" rid="ref30">30</xref>]</td>
                <td>Crowdsourcing with initial hand-coding</td>
                <td>3</td>
                <td>5000: relevance; <break/>4978: content</td>
                <td>NR</td>
                <td>3804</td>
                <td>NR</td>
                <td>κ=.66 to .85 among a subset coded by researchers</td>
              </tr>
              <tr valign="top">
                <td>[<xref ref-type="bibr" rid="ref31">31</xref>]</td>
                <td>Topic modeling with machine learning; <break/>MALLET, a command-line implementation of latent Dirichlet allocation (LDA)</td>
                <td>NR</td>
                <td>319,315: total; <break/>95,738: hookah; <break/>22,513: cigar; <break/>201,064: cigarette</td>
                <td>NR</td>
                <td>NR</td>
                <td>NR</td>
                <td>NR</td>
              </tr>
              <tr valign="top">
                <td>[<xref ref-type="bibr" rid="ref32">32</xref>]</td>
                <td>Topic modeling (LDA) with <break/>machine learning</td>
                <td>NR</td>
                <td>4962</td>
                <td>NR</td>
                <td>NR</td>
                <td>NR</td>
                <td>NR</td>
              </tr>
              <tr valign="top">
                <td>[<xref ref-type="bibr" rid="ref33">33</xref>]</td>
                <td>Machine learning and hand-coding; DiscoverText</td>
                <td>2: for a subset of 500 for relevance, 4500 for commercial versus <break/>organic, 7500 for <break/>cessation</td>
                <td>73,672</td>
                <td>Yes</td>
                <td>23,700</td>
                <td>Yes, hand-coded tweets with URLs</td>
                <td>κ=.87 to .93</td>
              </tr>
              <tr valign="top">
                <td>[<xref ref-type="bibr" rid="ref34">34</xref>]</td>
                <td>Hand-coded by researchers</td>
                <td>1: all; <break/>2: for subsets of 100 tweets</td>
                <td>5000: relevance; <break/>2847: content</td>
                <td>NR</td>
                <td>NR</td>
                <td>Yes</td>
                <td>κ=.64 to 1.00</td>
              </tr>
              <tr valign="top">
                <td>[<xref ref-type="bibr" rid="ref35">35</xref>]</td>
                <td>Hand-coded by researchers</td>
                <td>1: all tweets; <break/>3: subsample</td>
                <td>133</td>
                <td>No</td>
                <td>NR</td>
                <td>NR</td>
                <td>alpha = .61 to 1.00</td>
              </tr>
              <tr valign="top">
                <td>[<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                <td>Hand-coded by researchers</td>
                <td>3</td>
                <td>3935: relevance, <break/>foreign language, retweets; <break/>2656 sampled for 288 original tweets for coding</td>
                <td>No</td>
                <td>346</td>
                <td>Yes</td>
                <td>κ=.64 to .91</td>
              </tr>
              <tr valign="top">
                <td>[<xref ref-type="bibr" rid="ref37">37</xref>]</td>
                <td>Hand-coded by researchers; wordcloud R package</td>
                <td>NR</td>
                <td>171: relevance; <break/>84: content</td>
                <td>NR</td>
                <td>84</td>
                <td>NR</td>
                <td>NR</td>
              </tr>
              <tr valign="top">
                <td>[<xref ref-type="bibr" rid="ref38">38</xref>]</td>
                <td>Hand-coded by researchers</td>
                <td>1: all tweets; <break/>2: for 20% of tweets</td>
                <td>143,287: identified; <break/>4753: coded for clinical practice guidelines for <break/>treating tobacco <break/>dependence</td>
                <td>NR</td>
                <td>153</td>
                <td>Yes</td>
                <td>&#62;90%</td>
              </tr>
              <tr valign="top">
                <td>[<xref ref-type="bibr" rid="ref39">39</xref>]</td>
                <td>Hand-coded by researchers</td>
                <td>2</td>
                <td>684</td>
                <td>Yes</td>
                <td>306</td>
                <td>Yes</td>
                <td>NR</td>
              </tr>
              <tr valign="top">
                <td>[<xref ref-type="bibr" rid="ref40">40</xref>]</td>
                <td>Machine learning and hand-coding; naïve Bayes, <break/>LIBLINEAR, Bayesian logistic regression, <break/>random forests; keyword <break/>comparisons</td>
                <td>1: all tweets; <break/>2: subsample of 2000</td>
                <td>13,146</td>
                <td>NR</td>
                <td>2147</td>
                <td>No, removed URLs</td>
                <td>κ=.87 for subsample</td>
              </tr>
              <tr valign="top">
                <td>[<xref ref-type="bibr" rid="ref41">41</xref>]</td>
                <td>Machine learning and hand-coding; human detection algorithm; <break/>Hedonometrics; key phrasal <break/>pattern matching</td>
                <td>2: for all tweets from 500 automated accounts and 500 organic <break/>accounts as classified by the algorithm; <break/>2: for 4 groups of 500 randomly sampled tweets to gauge <break/>accuracy of <break/>subcategorical tweet topics</td>
                <td>850,000</td>
                <td>Yes</td>
                <td>131,622: <break/>automated <break/>accounts; <break/>134717: organic accounts: <break/>188,182: not classified <break/>accounts (ie, <break/>accounts with &#60;25 tweets)</td>
                <td>No, but the <break/>algorithm used the count of URLs to <break/>distinguish <break/>automated <break/>accounts from <break/>organic accounts; also used <break/>keywords in the URLs for the <break/>algorithm to <break/>determine <break/>subcategories of automated <break/>accounts</td>
                <td>94.6% true- <break/>positive rate, 12.9% false- <break/>positive rate for the machines on the tweets from the 1000 <break/>accounts <break/>also coded with <break/>human-coding</td>
              </tr>
              <tr valign="top">
                <td>[<xref ref-type="bibr" rid="ref42">42</xref>]</td>
                <td>Machine learning with initial hand-coding; Python Scikit-Learn; <break/>topic modeling with MALLET</td>
                <td>2: for a subset of 1000 profiles</td>
                <td>224,000 in 2013 sample; <break/>349,401 in 2015 sample</td>
                <td>Yes</td>
                <td>34,000 in 2013 sample; <break/>100,000 in 2015 sample</td>
                <td>No; metadata on the presence of URL links</td>
                <td>κ=.88</td>
              </tr>
              <tr valign="top">
                <td>[<xref ref-type="bibr" rid="ref43">43</xref>]</td>
                <td>Hand-coded by researchers and MySQL pattern matcher</td>
                <td>NR</td>
                <td>1180</td>
                <td>Yes</td>
                <td>2: Blu and V2; <break/>537: users retweeting Blu and V2</td>
                <td>NR</td>
                <td>NR</td>
              </tr>
              <tr valign="top">
                <td>[<xref ref-type="bibr" rid="ref44">44</xref>]</td>
                <td>Hand-coded by researchers</td>
                <td>1: all tweets; <break/>2: for 20% of tweets (n=358)</td>
                <td>2191: relevance; <break/>1790: content</td>
                <td>Yes</td>
                <td>NR (&#62;21)</td>
                <td>NR</td>
                <td>κ=.95 for 20% <break/>subsample</td>
              </tr>
              <tr valign="top">
                <td>[<xref ref-type="bibr" rid="ref45">45</xref>]</td>
                <td>Machine learning with initial hand-coding; naïve Bayes classifier, k-nearest <break/>neighbors, <break/>support vector machines</td>
                <td>6: for a subset of 250 tweets; <break/>NR for total</td>
                <td>17,098: relevance; <break/>10,128: content</td>
                <td>Yes, if additional context</td>
                <td>NR</td>
                <td>NR</td>
                <td>κ=.64 to .70</td>
              </tr>
              <tr valign="top">
                <td>[<xref ref-type="bibr" rid="ref46">46</xref>]</td>
                <td>Hand-coded by researchers</td>
                <td>3</td>
                <td>1776</td>
                <td>No</td>
                <td>16</td>
                <td>Yes</td>
                <td>For 5% of data, 95.7%; <break/>κ=.72</td>
              </tr>
              <tr valign="top">
                <td>[<xref ref-type="bibr" rid="ref47">47</xref>]</td>
                <td>Machine learning with initial hand-coding; naïve Bayes classifier</td>
                <td>2: subset of 450 tweets for relevance; <break/>2: subset of 350 tweets for content</td>
                <td>245,319: relevance; <break/>193,491: content</td>
                <td>NR</td>
                <td>166,857</td>
                <td>NR; metadata on the presence of URL links</td>
                <td>κ=.93</td>
              </tr>
              <tr valign="top">
                <td>[<xref ref-type="bibr" rid="ref48">48</xref>]</td>
                <td>Hand-coded by researchers</td>
                <td>1: all tweets; <break/>2: for 1% of tweets</td>
                <td>8645: relevance; <break/>6257: content</td>
                <td>Yes</td>
                <td>NR</td>
                <td>Yes</td>
                <td>90% for a 1% sample of tweets</td>
              </tr>
              <tr valign="top">
                <td>[<xref ref-type="bibr" rid="ref49">49</xref>]</td>
                <td>Hand-coded by researchers</td>
                <td>2</td>
                <td>900, with 50 tweets per account</td>
                <td>Yes</td>
                <td>18</td>
                <td>NR</td>
                <td>84%</td>
              </tr>
              <tr valign="top">
                <td>[<xref ref-type="bibr" rid="ref50">50</xref>]</td>
                <td>Hand-coded by researchers</td>
                <td>2</td>
                <td>1519</td>
                <td>No</td>
                <td>1321</td>
                <td>Yes</td>
                <td>κ=.84</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>NR: not reported.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Coded Categories</title>
        <p>All the studies developed categories for content. These content areas included one or more of the following: sentiment, theme, location of use, user description, profile photo, or location of user (<xref ref-type="table" rid="table4">Table 4</xref>).</p>
        <sec>
          <title>Sentiment</title>
          <p>A total of 9 articles coded for sentiment (<xref ref-type="table" rid="table4">Table 4</xref>). One article made a distinction between coding for sentiment (ie, emotional tone or affective content: positive, negative, or neutral) and message attitude (ie, pro, con, neutral or do not know) [<xref ref-type="bibr" rid="ref28">28</xref>]. Two articles coded for sentiment in terms of emotional tone. In 6 articles, sentiment was described in terms of being supportive or against tobacco, tobacco users, or decisions regarding tobacco, which suggests an assessment of message attitude. Furthermore, 1 article assessed valence, but it was not clear whether positive or negative valence suggested an attitude or emotional tone [<xref ref-type="bibr" rid="ref35">35</xref>].</p>
        </sec>
        <sec>
          <title>Topic or Theme</title>
          <p>A total of 21 studies coded for topic or theme (<xref ref-type="table" rid="table4">Table 4</xref>). The most common themes included the following: advertisement, marketing, industry or commercial (n=12 articles); health, safety, harms (n=9); use (n=8); policy, government, regulation, activism (n=7); e-cigarettes for smoking cessation (n=7); flavors (n=7); personal opinion or communication (n=6); risky behaviors or other substances (n=6); cessation (n=5); information (n=5), and craving or need (n=5). One study coded for location of use with 20 categories (eg, school, work) [<xref ref-type="bibr" rid="ref26">26</xref>]. Finally, 2 studies used topic modeling to explore tobacco content [<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref32">32</xref>].</p>
        </sec>
        <sec>
          <title>User or Account</title>
          <p>A total of 10 studies coded for user description from data found in the user profile, including type of account, age, location, and other characteristics (<xref ref-type="table" rid="table4">Table 4</xref>). The most common types of user categories coded were personal accounts (n=7 articles), industry accounts (n=5), news (n=5), unclassified (n=5), and bots, automatic, or fake (n=4; ie, automated computer program). None of the articles reported the percentage of tweets that had accounts without user profile information. However, across the articles with a category for tweets with an unclassifiable user description, 0.2%-38% of tweets were unclassified. Across the studies that coded for bots, the percentages of tweets varied drastically from 6.9% to 80.7%.</p>
          <p>One study coded Twitter profile photos with 4 categories: gender, age, race, and single person versus multiple people [<xref ref-type="bibr" rid="ref36">36</xref>]. Visual cues (eg, skin color, background themes, facial features) in the profile pictures were used for coding. Coding for age based on available visual cues in the profile photos tended to be difficult, so coding for age was simplified to 3 broad groups: young, middle age, and older adult. There were few middle-aged and older adults represented in the sample, so a dichotomous variable of young or not young was created [<xref ref-type="bibr" rid="ref36">36</xref>].</p>
          <p>A total of 4 studies coded for the location of the user with one each coding for state (California vs other) [<xref ref-type="bibr" rid="ref8">8</xref>], country [<xref ref-type="bibr" rid="ref37">37</xref>], continent [<xref ref-type="bibr" rid="ref38">38</xref>], and city, state, and country (United States vs other) [<xref ref-type="bibr" rid="ref39">39</xref>]. Location was identified for 51% to 63% of Twitter profiles. Most accounts that listed a location were from the United States and North America.</p>
          <table-wrap position="float" id="table4">
            <label>Table 4</label>
            <caption>
              <p>Coded categories.</p>
            </caption>
            <table width="746" cellpadding="7" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="110"/>
              <col width="20"/>
              <col width="240"/>
              <col width="90"/>
              <col width="140"/>
              <thead>
                <tr valign="top">
                  <td>Category type</td>
                  <td colspan="2">Category</td>
                  <td>Number of articles and percent of total<sup>a</sup>  <break/>n (%)</td>
                  <td>Articles</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>Relevance</td>
                  <td colspan="2">Relevant versus nonrelevant</td>
                  <td>16 (59)</td>
                  <td>[<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref41">41</xref>-<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref47">47</xref>-<xref ref-type="bibr" rid="ref49">49</xref>]</td>
                </tr>
                <tr valign="top">
                  <td>Sentiment</td>
                  <td colspan="2"><break/></td>
                  <td>9 (33)</td>
                  <td>[<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref50">50</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Positive or negative (ie, supportive or against)</td>
                  <td>6 (22)</td>
                  <td>[<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref50">50</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Positive or negative (ie, emotional tone)</td>
                  <td>2 (7)</td>
                  <td>[<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref41">41</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Positive or negative valence</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref35">35</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Neutral or unknown</td>
                  <td>6 (22)</td>
                  <td>[<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref50">50</xref>]</td>
                </tr>
                <tr valign="top">
                  <td>Message attitude</td>
                  <td colspan="2">Pro or con</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref28">28</xref>]</td>
                </tr>
                <tr valign="top">
                  <td>Type of utterance</td>
                  <td colspan="2">Comparison versus attribution versus metonymy</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref35">35</xref>]</td>
                </tr>
                <tr valign="top">
                  <td>Topics, themes, or genres</td>
                  <td colspan="2"><break/></td>
                  <td>21 (78)</td>
                  <td>[<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref25">25</xref>-<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref36">36</xref>-<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref45">45</xref>-<xref ref-type="bibr" rid="ref47">47</xref>,<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref50">50</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Joke or humorous</td>
                  <td>3 (11)</td>
                  <td>[<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Song or music</td>
                  <td>2 (7)</td>
                  <td>[<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Profanity</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Social relationships</td>
                  <td>2 (7)</td>
                  <td>[<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref50">50</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Sex or romance</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref30">30</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Image or stereotype</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref27">27</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Risky behaviors or other substances</td>
                  <td>6 (22)</td>
                  <td>[<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Illicit substance use in e-cigarettes</td>
                  <td>2 (7)</td>
                  <td>[<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Preference for another substance</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref30">30</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Affiliation and preference</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Flavors</td>
                  <td>7 (26)</td>
                  <td>[<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref41">41</xref>-<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Pleasure</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref27">27</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Tastes good</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref28">28</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Craving, desire, and need</td>
                  <td>5 (19)</td>
                  <td>[<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Addiction</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref37">37</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Type of tobacco product</td>
                  <td>4 (15)</td>
                  <td>[<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref38">38</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Type of tobacco product brand</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref26">26</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">E-cigarettes’ smoke-free aspect</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref42">42</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Health, safety, harms</td>
                  <td>9 (33)</td>
                  <td>[<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref50">50</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Downplayed or refuted harms, harm reduction</td>
                  <td>2 (7)</td>
                  <td>[<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref42">42</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">E-cigarettes for smoking cessation</td>
                  <td>7 (26)</td>
                  <td>[<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref40">40</xref>-<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Cessation</td>
                  <td>5 (19)</td>
                  <td>[<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref46">46</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Cessation product</td>
                  <td>2 (7)</td>
                  <td>[<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref38">38</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Socioemotional support tweets regarding quitting smoking</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref49">49</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Encouraging or engaging tweets regarding quitting smoking</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref49">49</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Clinical practice guidelines for treating tobacco dependence</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref38">38</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Demonstration</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2"><bold>Use</bold></td>
                  <td>8 (30)</td>
                  <td>[<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td><break/></td>
                  <td>Use: general</td>
                  <td>2 (7)</td>
                  <td>[<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref40">40</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td><break/></td>
                  <td>First-person use or intent</td>
                  <td>5 (19)</td>
                  <td>[<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td><break/></td>
                  <td>Second- or third-person experience</td>
                  <td>4 (15)</td>
                  <td>[<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td><break/></td>
                  <td>Starting use or smoking initiation</td>
                  <td>3 (11)</td>
                  <td>[<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref37">37</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td><break/></td>
                  <td>Recent use</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref30">30</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td><break/></td>
                  <td>Underage use</td>
                  <td>3 (11)</td>
                  <td>[<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td><break/></td>
                  <td>Parental use</td>
                  <td>2 (7)</td>
                  <td>[<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td><break/></td>
                  <td>Does not use or does not want to use</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref30">30</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Secondhand smoke</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref46">46</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Rejection and prevention</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Disgust, unattractive, or uncool</td>
                  <td>2 (7)</td>
                  <td>[<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref30">30</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Policy, government, regulation, activism, politics</td>
                  <td>7 (26)</td>
                  <td>[<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref46">46</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Normalization versus discouragement</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref30">30</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Getting others started or advocating use</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref28">28</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Attempt to engage other Twitter users</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref28">28</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Fear appeals</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref47">47</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Lies or propaganda</td>
                  <td>2 (7)</td>
                  <td>[<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref39">39</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Advertisement, promotion, marketing, industry, commercial</td>
                  <td>12 (44)</td>
                  <td>[<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref25">25</xref>-<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref50">50</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Offering advice</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref28">28</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Personal opinion or communication</td>
                  <td>6 (22)</td>
                  <td>[<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">News or update</td>
                  <td>4 (15)</td>
                  <td>[<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Information</td>
                  <td>5 (19)</td>
                  <td>[<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref49">49</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Science or scientific publication</td>
                  <td>2 (7)</td>
                  <td>[<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref39">39</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Cultural reference</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref27">27</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Issue salience</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref39">39</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Commodity</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref27">27</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Connoisseurship</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref27">27</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Cheaper than smoking</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref28">28</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Money</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref8">8</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Price promotion, discount, coupon</td>
                  <td>4 (15)</td>
                  <td>[<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref41">41</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Backgrounded</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref27">27</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Other or undetermined</td>
                  <td>2 (7)</td>
                  <td>[<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref50">50</xref>]</td>
                </tr>
                <tr valign="top">
                  <td>Domains smoking was compared with for <break/>campaign slogans</td>
                  <td colspan="2">Personal features; hobby or hype; person or group; social norm; big event; technology and innovation; sex or relation; eating, drinking, and stimulants; school; transport; and campaign</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref35">35</xref>]</td>
                </tr>
                <tr valign="top">
                  <td>Links (URLs)</td>
                  <td colspan="2">Most common links</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref26">26</xref>]</td>
                </tr>
                <tr valign="top">
                  <td>Location of use</td>
                  <td colspan="2"><break/></td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref26">26</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Class</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref26">26</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">House, room, bed</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref26">26</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">School</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref26">26</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Public</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref26">26</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Bathroom</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref26">26</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Work</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref26">26</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">In front of someone</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref26">26</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Car</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref26">26</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Restaurant</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref26">26</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Movie theater</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref26">26</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Airplanes or airport</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref26">26</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Store</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref26">26</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Bars or clubs</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref26">26</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Dormitory</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref26">26</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Library</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref26">26</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Mall</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref26">26</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Bowling alley</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref26">26</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Café or coffee shop</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref26">26</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Hospital</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref26">26</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Locker room</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref26">26</xref>]</td>
                </tr>
                <tr valign="top">
                  <td>Topic modeling</td>
                  <td colspan="2"><break/></td>
                  <td>2 (7)</td>
                  <td>[<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref32">32</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Hookah topic 1: social locations, leisure time, and positive affect</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref31">31</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Hookah topic 2: fun, leisure time, and sociability</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref31">31</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Cigarette topic 1: death and unpleasant smell</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref31">31</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Cigar topic 1: positive affect and enjoyment</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref31">31</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Cigar topic 2: luxury alcohol products</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref31">31</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Tobacco topic 1: tobacco use and substance use</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref32">32</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Tobacco topic 2: addiction recovery</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref32">32</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Tobacco topic 3: addiction recovery and tobacco promotion by clubs or bars</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref32">32</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Tobacco topic 4: tobacco promotion by bars or clubs and <break/>marijuana use</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref32">32</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Tobacco topic 5: antismoking and addiction recovery</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref32">32</xref>]</td>
                </tr>
                <tr valign="top">
                  <td>User or account</td>
                  <td colspan="2"><break/></td>
                  <td>10 (37)</td>
                  <td>[<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref49">49</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Government</td>
                  <td>3 (11)</td>
                  <td>[<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Foundations or nonprofit organizations</td>
                  <td>4 (15)</td>
                  <td>[<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref49">49</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Public health and health care</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref28">28</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Researcher or research center</td>
                  <td>2 (7)</td>
                  <td>[<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref37">37</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2"><bold>News</bold></td>
                  <td>5 (19)</td>
                  <td>[<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td><break/></td>
                  <td>Reputable news source</td>
                  <td>2 (7)</td>
                  <td>[<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td><break/></td>
                  <td>Press, media, or news</td>
                  <td>3 (11)</td>
                  <td>[<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref44">44</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td><break/></td>
                  <td>Medical news source</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref37">37</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2"><bold>Personal accounts</bold></td>
                  <td>7 (26)</td>
                  <td>[<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td><break/></td>
                  <td>Personal accounts, everyday people, individuals</td>
                  <td>6 (22)</td>
                  <td>[<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td><break/></td>
                  <td>Personal accounts with industry ties</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref28">28</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td><break/></td>
                  <td>Person: supporter</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref29">29</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td><break/></td>
                  <td>Person: basic profile (no mention of e-cigarettes)</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref29">29</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Celebrity, public figures</td>
                  <td>3 (11)</td>
                  <td>[<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Organic (human)</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref41">41</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">E-cigarette community movement</td>
                  <td>2 (7)</td>
                  <td>[<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2"><bold>Industry</bold></td>
                  <td>5 (19)</td>
                  <td>[<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td><break/></td>
                  <td>Industry: retailer or manufacturer</td>
                  <td>2 (7)</td>
                  <td>[<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td><break/></td>
                  <td>Retailer or vendor</td>
                  <td>3 (11)</td>
                  <td>[<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td><break/></td>
                  <td>Tobacco company</td>
                  <td>2 (7)</td>
                  <td>[<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td><break/></td>
                  <td>Industry: other (eg, vaping magazine, Web marketer)</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref29">29</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">For-profit organization</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref44">44</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Entity: general (eg, company, store, advocacy group)</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref8">8</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Nonperson (eg, musical band)</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref29">29</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Bots, automatic, fake</td>
                  <td>4 (15)</td>
                  <td>[<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Unclassified or other</td>
                  <td>5 (19)</td>
                  <td>[<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref49">49</xref>]</td>
                </tr>
                <tr valign="top">
                  <td>Profile photo</td>
                  <td colspan="2"><break/></td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Single person versus multiple people</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Gender (male, female, mixed group)</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Age (babies or children, high school or college, adult)</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Race (African American, white, Hispanic, Asian, undetermined)</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                </tr>
                <tr valign="top">
                  <td>Location of user</td>
                  <td colspan="2"><break/></td>
                  <td>4 (15)</td>
                  <td>[<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref37">37</xref>-<xref ref-type="bibr" rid="ref39">39</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">City, state, and country</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref39">39</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">State</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref8">8</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Country</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref37">37</xref>]</td>
                </tr>
                <tr valign="top">
                  <td><break/></td>
                  <td colspan="2">Continent</td>
                  <td>1 (4)</td>
                  <td>[<xref ref-type="bibr" rid="ref38">38</xref>]</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table4fn1">
                <p><sup>a</sup>Percentages are rounded to the nearest whole percent.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
        </sec>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Overview</title>
        <p>Studies analyzing tobacco-related Twitter data have grown in number in recent years. Although we searched for articles published from 2006 to 2016, articles meeting inclusion criteria for this review were published from 2011 to 2016, with 85% (23/27) of the publications occurring in 2014-2016. Widely used among adolescents and black and Hispanic individuals, Twitter could provide a rich source of tobacco-related data among these groups. One of the benefits of Twitter research is the ability to focus on emerging issues and products that are not yet addressed in surveillance or epidemiological research. Collecting tobacco data in real time via Twitter could be a useful tool for tobacco surveillance, which could help inform tobacco control policies and social media campaigns.</p>
      </sec>
      <sec>
        <title>Data Collection Methods</title>
        <p>Twitter data can change rapidly as they are being posted daily [<xref ref-type="bibr" rid="ref37">37</xref>]. If a study only collects data from one point in time, it may not be reflective of data at any other point in time. Twitter studies should consider collecting data at multiple time points or over longer periods of time to decrease the likelihood that results are idiosyncratic to that point in time. However, there may be some research questions that only require sampling one time or sampling directly before and after an event to gauge short-term responses.</p>
        <p>The primary sources of data were Gnip and Twitter’s Streaming API, which offer different strengths and weaknesses. If a study wants access to all tobacco-related tweets, then Gnip may be more effective. However, if a study is interested in tweets about a specific tobacco campaign or has a constrained budget, then Twitter’s Streaming API may be a better data source. Alternatively, if a study is focusing on multiple social media sites (eg, Twitter, Facebook), then using Radian6, Simply Measured, or Sysomos Heartbeat may be appealing because of their cross-platform analysis.</p>
        <p>The results of this review suggest that there are some gaps in the types of tobacco products studied by Twitter analyses. E-cigarettes were the product that was addressed by most studies, while none of the studies focused on smokeless tobacco, snus, bidis, or kreteks. The focus on e-cigarettes over other products could be due in part to their recent rise in popularity and recent debates about policies. From 2011 to 2014, e-cigarette use among high school students in the United States significantly increased from 1.5% to 13.4% [<xref ref-type="bibr" rid="ref53">53</xref>]. Similarly, there was a significant increase in hookah use from 4.1% to 9.4%. However, there were significant decreases for cigarette (15.8% to 9.2%), snus (2.9% to 1.9%), cigar (11.6% to 8.2%), pipe (4.0% to 1.5%), and bidi (2.0% to 0.9%) use [<xref ref-type="bibr" rid="ref53">53</xref>]. It could be useful to conduct studies comparing tweets about cigarettes, e-cigarettes, and hookah among adolescents to help understand the changing rates of use and Twitter postings that discuss issues related to use. The rates of e-cigarette, hookah, and cigar use among high school students may be affected by the FDA regulations of these products that went into effect on August 8, 2016. One of the provisions of these regulations is that it will be illegal to sell e-cigarettes, cigars, and hookah tobacco to persons younger than 18 years [<xref ref-type="bibr" rid="ref54">54</xref>]. Researchers may want to analyze e-cigarette, cigar, and hookah tweets before and after August 8, 2016, to gain real-time insight into adolescents’ reactions to the new regulations.</p>
        <p>Future Twitter studies could benefit from a standard of reporting data collection methods. Only 4 of the articles in this review reported such rigorous methods of selecting their search keywords as suggested by Kim and colleagues’ [<xref ref-type="bibr" rid="ref11">11</xref>] search filter framework, while 15 articles reported retrieval precision and 4 reported retrieval recall. The terminology around newer products such as e-cigarettes is growing, so it may be difficult to capture all relevant Twitter conversations with one’s keywords [<xref ref-type="bibr" rid="ref25">25</xref>]. Future studies will need to continue to refine and expand search keywords.</p>
      </sec>
      <sec>
        <title>Data Coding</title>
        <p>The methods of coding were hand-coding, machine learning, or a combination of the two. Machine learning can code larger quantities of data at a quicker rate than hand-coding, but human coders may have greater discretion at coding for the complexities and subtlety of language such as humor, irony, or sarcasm. For example, algorithms developed to detect irony only retrieved 54%-57% of tweets coded as irony by multiple independent human coders [<xref ref-type="bibr" rid="ref55">55</xref>]. Hand-coding can be subject to bias, but creating coding schemes based on prior literature and working to achieve acceptable levels of interrater reliability can help attenuate individual bias. Hand-coding allows researchers to follow URLs, which can change the meaning of the tweet. Viewing the webpage may provide additional information that may not be discernable from the URL. Studies that require determining subtle differences in context may be better suited to hand-coding a small sample of Twitter data, while studies that rely less on context could code large samples with machine learning.</p>
      </sec>
      <sec>
        <title>Coded Categories</title>
        <p>The sentiment of tweets could help evaluate whether the responses to pro- and antitobacco efforts are positive or negative as a way of understanding social norms about these products. Clarity and comparability across studies could be improved if a distinction is made between attitude and emotion when coding for sentiment. For example, a tweet could be pro-vaping but have a negative emotional tone or it could be anti-vaping but have a positive tone. Only 1 article clarified the meaning by making an explicit distinction between coding for emotional sentiment and message attitude [<xref ref-type="bibr" rid="ref28">28</xref>]. This is reflective of coding for stance (in favor of, against, or neutral) versus sentiment (emotional tone) [<xref ref-type="bibr" rid="ref56">56</xref>].</p>
        <p>The three most common themes used for coding were advertisements or marketing; health, safety, harms; and use. Surveillance of these themes could be beneficial to understand whether tobacco advertisements are being circulated on Twitter with the potential of reaching underage individuals, whether the content is making unproven claims about the health and safety of their products, or promoting the use of their products to vulnerable populations such as youth or ethnic minorities.</p>
        <p>The most common user account descriptions that the studies coded for were personal accounts, industry, news, unclassified, and bots. Determining the user description and demographic information for the accounts that tweet about tobacco could help determine whether tobacco companies, pro-vaping advocacy groups, or antitobacco efforts are circulating with a potential to reach certain groups (eg, adolescents). Researchers could also monitor how news organizations are presenting tobacco-related information to the public.</p>
        <p>It may be difficult to determine the demographics of the person tweeting or of the audience exposed to the tweets, which could be especially problematic when studies want to focus on vulnerable populations (eg, adolescents). A Twitter account could be run by an individual, multiple people (eg, vape shop employees), or bots. To reduce bias, bots should be identified and the tweets from these accounts removed from analysis or identified as tweets originating from automated accounts [<xref ref-type="bibr" rid="ref57">57</xref>]. Only 4 studies coded for bots with a range from 6.9% to 80.7% of tweets classified as bots. Even if an account is run by an individual, a Twitter profile provides little information. It may or may not include a photograph, profile description, location, website, and birthday. It does not include gender or ethnicity and race, so this information needs to be estimated. Although none of the studies reported the percentage of tweets with accounts missing profile information, 5 studies coded for an unclassified category with 0.2%-38% of tweets being unable to be classified based on the account profile. If profile information is included, it could be used in combination with natural language processing to infer information about the individual from his or her tweets [<xref ref-type="bibr" rid="ref29">29</xref>]. For example, algorithms have estimated gender with a 75.5% accuracy based on tweets and a 92.0% accuracy based on tweets, screen name, full name, and profile description [<xref ref-type="bibr" rid="ref58">58</xref>]. A study that combined analysis of text and image processing predicted gender with an accuracy of 85.1% [<xref ref-type="bibr" rid="ref59">59</xref>]. Additionally, algorithms based on tweets were capable of predicting the exact age of the user within a margin of 4 years, while accuracy for age categories were 93.0% for &#60;20 years, 67.4% for 20-40 years, and 81.6 for &#62;40 years [<xref ref-type="bibr" rid="ref60">60</xref>].</p>
      </sec>
      <sec>
        <title>Recommendations</title>
        <p>It is recommended that tobacco Twitter studies adopt methodological standards of reporting and data quality assessment. Important information to consider reporting include data sources (eg, Gnip, Twitter’s Streaming API), the date range of tweets collected, the number of tweets coded, whether retweets were coded, whether coders followed URLs, whether images were coded, the categories coded, the decision criteria for each category, the number of unique Twitter accounts, and the types of Twitter accounts. Studies that use hand-coding should also consider reporting the number of independent coders, the number of tweets coded across coders, and their coding agreement, while it is important for machine learning studies to detail the development and refinement of their algorithms. Providing this information is likely to increase comparability across studies and the ability to replicate results.</p>
        <p>Depending on research goals, studies may want to sample Twitter’s databases multiple times, especially if they collect from Twitter’s Search API or Streaming API, which put limitations on the amount of data that can be collected per sample. Sampling at multiple times is also important for studies that have access to Twitter’s Firehose through Gnip, considering that tweets are in real time, which could lead to fluctuations based on real-world events (eg, the FDA’s new regulations for e-cigarettes). Following messages over time could also help establish trends in the content of posts. However, some studies may be interested in short-term reactions to an event, which requires different sampling methods than following trends. For example, if a study is interested in short-term reactions to the FDA’s new regulations for e-cigarettes, then a single sample before and after the implementation of the new regulations could be sufficient.</p>
        <p>When coding for sentiment, researchers could improve clarity by making a distinction between whether they are coding for message attitude or for emotional tone [<xref ref-type="bibr" rid="ref28">28</xref>]. A clear distinction between the two could improve comparability of sentiment ratings across studies.</p>
        <p>If relevant to the research questions, Twitter studies may want to code images and URLs. This added step can be time-consuming, but doing so could change the context or meaning of a tweet. For example, an image could help determine if a tweet should be coded as humor or sarcasm, while following a URL could help determine if the tweet is an advertisement. Failing to code images and URLs could result in missing significant content that could affect coding accuracy and skew results.</p>
        <p>Analyzing Twitter user profiles could provide context for tweets. The same pro–e-cigarette tweet could hold very different significance for a study’s results if it is from a vape shop versus an adolescent. However, the limitations of analyzing user profiles should be recognized and steps taken to improve accuracy. It should be noted that user profiles may be misleading (eg, a tobacco industry representative posing as an unaffiliated citizen) or profiles of bots. Bots should be identified and potentially removed to reduce bias and improve the quality of data [<xref ref-type="bibr" rid="ref57">57</xref>]. We cannot assume that the analysis is describing individuals but must instead consider the poster to be an “account” rather than a person.</p>
        <p>A limitation of Twitter data is that it does not provide much information on the effects of tweets on behavior. For example, tweeting about tobacco use does not necessarily mean that the person tweeting uses tobacco [<xref ref-type="bibr" rid="ref40">40</xref>]. Additionally, an individual may tweet about a quit smoking campaign with positive sentiment, but that does not mean that the campaign has influenced his or her smoking behavior. Follow-up studies with the individuals tweeting about the campaign would need to be conducted. None of the studies in the review included follow-up survey studies with individuals from their Twitter sample. Although recruitment of individuals through Twitter may come with its own set of obstacles, this could be an avenue for future Twitter research. Following specific individuals over time could allow for the analysis of changes in message content.</p>
      </sec>
      <sec>
        <title>Review Limitations</title>
        <p>There are several limitations of this systematic review. First, the results are limited to the databases and search keywords selected, which could have resulted in incomplete retrieval of identified research. Second, this review is limited to its inclusion criteria and the decision rules of the single, independent coder who selected the articles and extracted the data to be included in the review. Individual bias was limited by explicit inclusion, exclusion, and data extraction criteria. However, some studies that were included or excluded for this review may have varied given different inclusion criteria or a different coder. Finally, this review is limited to methodology of categorically coded tobacco Twitter data. Different methodological results and recommendations may have been made if the topic of Twitter data had been different (eg, marijuana) or if the review had focused on different outcomes (eg, popularity of tweets or diffusion of tweets).</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>Categorically coded Twitter research can be used for certain insights that other survey research does not provide: emerging issues, popular content in real time, changes over time, how tobacco companies and pro-vaping advocacy groups use social media to increase message exposure in the population (eg, youth who might otherwise be protected from tobacco marketing), how tobacco control policies and campaigns can most effectively use social media, arguments by groups that may be incorporated into media message design, and quick reactions to antitobacco media campaigns and regulations. There are several approaches that researchers are taking to this end, each having its own set of strengths and weaknesses. Standards for data collection and coding should be developed to more easily compare and replicate tobacco-related Twitter results. Additional recommendations, dependent on one’s research goals, include the following: sample Twitter’s databases multiple times, make a distinction between message attitude and emotional tone for sentiment, code images and URLs, analyze user profiles, and identify and remove bots.</p>
      </sec>
    </sec>
  </body>
  <back>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">API</term>
          <def>
            <p>application programming interface</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">FDA</term>
          <def>
            <p>US Food and Drug Administration</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This work was supported by the National Cancer Institute grant number T32CA009492-29 and the USC (University of Southern California) Tobacco Center of Regulatory Science for Vulnerable Populations grant number 3P50CA180905-04S1.</p>
    </ack>
    <fn-group>
      <fn fn-type="con">
        <p>BAL planned the review, conducted the literature search, synthesized the results, and wrote the manuscript. JBU, TBC, and KC assisted in the conceptualization of the review and edited the manuscript.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="web">
        <source>Twitter</source>  
        <year>2016</year>  
        <month>06</month>  
        <day>30</day>  
        <access-date>2016-11-17</access-date>
        <comment>Twitter Usage/Company Facts 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://about.twitter.com/company">https://about.twitter.com/company</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6m7ZjJlHW"/></comment> </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="web">
        <source>Twitter</source>  
        <year>2016</year>  
        <access-date>2016-11-17</access-date>
        <comment>Truth Initiative Twitter account 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://twitter.com/truthinitiative">https://twitter.com/truthinitiative</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6m7a6uQ5G"/></comment> </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="web">
        <source>Twitter</source>  
        <year>2016</year>  
        <access-date>2016-11-17</access-date>
        <comment>Blu Twitter account 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://twitter.com/blucigs">https://twitter.com/blucigs</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6m7aH0aG7"/></comment> </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="web">
        <source>Still Blowing Smoke</source>  
        <year>2016</year>  
        <access-date>2016-11-17</access-date>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://stillblowingsmoke.org/">http://stillblowingsmoke.org/</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="6m7aTK5La"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="web">
        <source>Not Blowing Smoke</source>  
        <year>2016</year>  
        <access-date>2016-11-17</access-date>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://notblowingsmoke.org/">http://notblowingsmoke.org/</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="6m7bVdDlq"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="web">
        <source>Twitter</source>  
        <year>2016</year>  
        <access-date>2016-11-17</access-date>
        <comment>Still Blowing Smoke account 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://twitter.com/stillblwngsmoke">https://twitter.com/stillblwngsmoke</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6m7bf3MPt"/></comment> </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="web">
        <source>Twitter</source>  
        <year>2016</year>  
        <access-date>2016-11-17</access-date>
        <comment>Not Blowing Smoke account 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://twitter.com/notblwngsmoke">https://twitter.com/notblwngsmoke</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6m7bpA286"/></comment> </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Allem</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Escobedo</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Chu</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Soto</surname>
            <given-names>DW</given-names>
          </name>
          <name name-style="western">
            <surname>Cruz</surname>
            <given-names>TB</given-names>
          </name>
          <name name-style="western">
            <surname>Unger</surname>
            <given-names>JB</given-names>
          </name>
        </person-group>
        <article-title>Campaigns and counter campaigns: reactions on Twitter to e-cigarette education</article-title>
        <source>Tob Control</source>  
        <year>2016</year>  
        <month>03</month>  
        <day>8</day>  
        <fpage>1</fpage>  
        <lpage>4</lpage>  
        <pub-id pub-id-type="doi">10.1136/tobaccocontrol-2015-052757</pub-id>
        <pub-id pub-id-type="medline">26956467</pub-id>
        <pub-id pub-id-type="pii">tobaccocontrol-2015-052757</pub-id>
        <pub-id pub-id-type="pmcid">PMC5018457</pub-id></nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Lenhart</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <source>Pew Research Center</source>  
        <year>2015</year>  
        <month>04</month>  
        <day>19</day>  
        <access-date>2016-11-18</access-date>
        <comment>Teen, Social Media and Technology Overview 2015 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.pewinternet.org/2015/04/09/teens-social-media-technology-2015">http://www.pewinternet.org/2015/04/09/teens-social-media-technology-2015</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6m7bxa9wU"/></comment> </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Duggan</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <source>Pew Research Center</source>  
        <year>2015</year>  
        <month>08</month>  
        <day>19</day>  
        <access-date>2016-11-18</access-date>
        <comment>Mobile Messaging and Social Media - 2015 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.pewinternet.org/2015/08/19/mobile-messaging-and-social-media-2015/">http://www.pewinternet.org/2015/08/19/mobile-messaging-and-social-media-2015/</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6m7cE9B8E"/></comment> </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Kim</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Huang</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Emery</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <article-title>Garbage in, Garbage Out: Data Collection, Quality Assessment and Reporting Standards for Social Media Data Use in Health Research, Infodemiology and Digital Disease Detection</article-title>
        <source>J Med Internet Res</source>  
        <year>2016</year>  
        <month>02</month>  
        <day>26</day>  
        <volume>18</volume>  
        <issue>2</issue>  
        <fpage>e41</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2016/2/e41/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/jmir.4738</pub-id>
        <pub-id pub-id-type="medline">26920122</pub-id>
        <pub-id pub-id-type="pii">v18i2e41</pub-id>
        <pub-id pub-id-type="pmcid">PMC4788740</pub-id></nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>O'Connor</surname>
            <given-names>RJ</given-names>
          </name>
        </person-group>
        <article-title>Non-cigarette tobacco products: what have we learnt and where are we headed?</article-title>
        <source>Tob Control</source>  
        <year>2012</year>  
        <month>03</month>  
        <volume>21</volume>  
        <issue>2</issue>  
        <fpage>181</fpage>  
        <lpage>90</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/22345243"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1136/tobaccocontrol-2011-050281</pub-id>
        <pub-id pub-id-type="medline">22345243</pub-id>
        <pub-id pub-id-type="pii">tobaccocontrol-2011-050281</pub-id>
        <pub-id pub-id-type="pmcid">PMC3716250</pub-id></nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="web">
        <source>US Food and Drug Administration</source>  
        <year>2016</year>  
        <month>05</month>  
        <day>05</day>  
        <access-date>2016-11-17</access-date>
        <comment>Recognize tobacco in its many forms 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.fda.gov/ForConsumers/ConsumerUpdates/ucm392735.htm">http://www.fda.gov/ForConsumers/ConsumerUpdates/ucm392735.htm</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6m7cRBDCk"/></comment> </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="web">
        <source>Twitter</source>  
        <year>2016</year>  
        <access-date>2016-11-17</access-date>
        <comment>Public API: GET statuses/user_timeline 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://dev.twitter.com/rest/reference/get/statuses/user_timeline">https://dev.twitter.com/rest/reference/get/statuses/user_timeline</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6m7ccAB9K"/></comment> </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="web">
        <source>Twitter</source>  
        <year>2016</year>  
        <access-date>2016-11-17</access-date>
        <comment>Public API: The Search API 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://dev.twitter.com/rest/public/search">https://dev.twitter.com/rest/public/search</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6m7dVm3hE"/></comment> </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="web">
        <source>R-project</source>  
        <year>2015</year>  
        <month>07</month>  
        <day>29</day>  
        <access-date>2016-11-16</access-date>
        <comment>twitteR: R Based Twitter Client 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://cran.r-project.org/web/packages/twitteR/index.html">https://cran.r-project.org/web/packages/twitteR/index.html</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6m7dfGPAu"/></comment> </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="web">
        <source>QSR International</source>  
        <year>2015</year>  
        <month>07</month>  
        <day>07</day>  
        <access-date>2016-11-18</access-date>
        <comment>What is NCapture? 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.qsrinternational.com/support/faqs/what-is-ncapture">http://www.qsrinternational.com/support/faqs/what-is-ncapture</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6m7dqDJge"/></comment> </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <collab>Social Media Research Foundation</collab>
        </person-group>
        <source>Social Network Importer for NodeXL</source>  
        <year>2015</year>  
        <month>03</month>  
        <day>21</day>  
        <access-date>2016-11-17</access-date>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://socialnetimporter.codeplex.com/">https://socialnetimporter.codeplex.com/</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="6m7dxDOHY"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="web">
        <source>Twitter</source>  
        <year>2016</year>  
        <access-date>2016-11-17</access-date>
        <comment>The Streaming APIs 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://dev.twitter.com/streaming/overview">https://dev.twitter.com/streaming/overview</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6m7e9SDuI"/></comment> </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="web">
        <source>Twitonomy</source>  
        <year>2016</year>  
        <access-date>2016-11-17</access-date>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.twitonomy.com/">http://www.twitonomy.com/</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="6m7eGH8hl"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <collab>Gnip Inc</collab>
        </person-group>
        <source>Gnip</source>  
        <year>2016</year>  
        <access-date>2016-11-18</access-date>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://www.gnip.com/">https://www.gnip.com/</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="6m7eNkJO2"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="web">
        <source>Salesforce Marketing Cloud</source>  
        <year>2016</year>  
        <access-date>2016-11-18</access-date>
        <comment>Radian6 is now part of Salesforce Marketing Cloud 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://www.marketingcloud.com/products/social-media-marketing/radian6/">https://www.marketingcloud.com/products/social-media-marketing/radian6/</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6m7eWXoMH"/></comment> </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <collab>Simply Measured Inc</collab>
        </person-group>
        <source>Simply Measured</source>  
        <year>2016</year>  
        <access-date>2016-11-18</access-date>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://simplymeasured.com/">http://simplymeasured.com/</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="6m7edX0IE"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="web">
        <source>Sysomos Heartbeat</source>  
        <access-date>2016-11-18</access-date>
        <comment>Proactive Social Media Monitoring 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://sysomos.com/products/heartbeat">https://sysomos.com/products/heartbeat</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6m7erpt4U"/></comment> </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Cole-Lewis</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Pugatch</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Sanders</surname>
            <given-names>A</given-names>
          </name>
        </person-group>
        <article-title>Social listening: a content analysis of e-cigarette discussions on Twitter</article-title>
        <source>J Med Internet Res</source>  
        <year>2015</year>  
        <volume>17</volume>  
        <fpage>e243</fpage>  
        <pub-id pub-id-type="doi">10.2196/jmir.4969</pub-id></nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Kim</surname>
            <given-names>AE</given-names>
          </name>
          <name name-style="western">
            <surname>Hopper</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Simpson</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Nonnemaker</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Lieberman</surname>
            <given-names>AJ</given-names>
          </name>
          <name name-style="western">
            <surname>Hansen</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Guillory</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Porter</surname>
            <given-names>L</given-names>
          </name>
        </person-group>
        <article-title>Using twitter data to gain insights into e-cigarette marketing and locations of use: an infoveillance study</article-title>
        <source>J Med Internet Res</source>  
        <year>2015</year>  
        <month>11</month>  
        <volume>17</volume>  
        <issue>11</issue>  
        <fpage>e251</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2015/11/e251/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/jmir.4466</pub-id>
        <pub-id pub-id-type="medline">26545927</pub-id>
        <pub-id pub-id-type="pii">v17i11e251</pub-id>
        <pub-id pub-id-type="pmcid">PMC4642798</pub-id></nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Myslín</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Zhu</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Chapman</surname>
            <given-names>W</given-names>
          </name>
          <name name-style="western">
            <surname>Conway</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Using twitter to examine smoking behavior and perceptions of emerging tobacco products</article-title>
        <source>J Med Internet Res</source>  
        <year>2013</year>  
        <month>08</month>  
        <volume>15</volume>  
        <issue>8</issue>  
        <fpage>e174</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2013/8/e174/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/jmir.2534</pub-id>
        <pub-id pub-id-type="medline">23989137</pub-id>
        <pub-id pub-id-type="pii">v15i8e174</pub-id>
        <pub-id pub-id-type="pmcid">PMC3758063</pub-id></nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>van der Tempel</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Noormohamed</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Schwartz</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Norman</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Malas</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Zawertailo</surname>
            <given-names>L</given-names>
          </name>
        </person-group>
        <article-title>Vape, quit, tweet? electronic cigarettes and smoking cessation on twitter</article-title>
        <source>Int J Public Health</source>  
        <year>2016</year>  
        <month>03</month>  
        <volume>61</volume>  
        <issue>2</issue>  
        <fpage>249</fpage>  
        <lpage>56</lpage>  
        <pub-id pub-id-type="doi">10.1007/s00038-016-0791-2</pub-id>
        <pub-id pub-id-type="medline">26841895</pub-id>
        <pub-id pub-id-type="pii">10.1007/s00038-016-0791-2</pub-id></nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Chu</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Unger</surname>
            <given-names>JB</given-names>
          </name>
          <name name-style="western">
            <surname>Allem</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Pattarroyo</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Soto</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Cruz</surname>
            <given-names>TB</given-names>
          </name>
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Jiang</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>CC</given-names>
          </name>
        </person-group>
        <article-title>Diffusion of messages from an electronic cigarette brand to potential users through twitter</article-title>
        <source>PLoS One</source>  
        <year>2015</year>  
        <volume>10</volume>  
        <issue>12</issue>  
        <fpage>e0145387</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0145387"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1371/journal.pone.0145387</pub-id>
        <pub-id pub-id-type="medline">26684746</pub-id>
        <pub-id pub-id-type="pii">PONE-D-15-34480</pub-id>
        <pub-id pub-id-type="pmcid">PMC4694088</pub-id></nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Krauss</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Sowles</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Moreno</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Hookah-related twitter chatter: a content analysis</article-title>
        <source>Prev Chronic Dis</source>  
        <year>2015</year>  
        <volume>12</volume>  
        <fpage>e121</fpage>  
        <pub-id pub-id-type="doi">10.5888/ped12.150140</pub-id></nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Jain</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Zhu</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Conway</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Exploring consumer attitudes towards hookah, cigarettes, and cigars using twitter</article-title>
        <source>Tobacco Reg Sci</source>  
        <year>2015</year>  
        <month>10</month>  
        <day>01</day>  
        <volume>1</volume>  
        <issue>3</issue>  
        <fpage>198</fpage>  
        <lpage>203</lpage>  
        <pub-id pub-id-type="doi">10.18001/TRS.1.3.1</pub-id></nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Prier</surname>
            <given-names>KW</given-names>
          </name>
          <name name-style="western">
            <surname>Smith</surname>
            <given-names>MS</given-names>
          </name>
          <name name-style="western">
            <surname>Giraud-Carrier</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Hanson</surname>
            <given-names>CL</given-names>
          </name>
        </person-group>
        <person-group person-group-type="editor">
          <name name-style="western">
            <surname>Salerno</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>Identifying health-related topics on twitter: an exploration of tobacco-related tweets as a test topic</article-title>
        <source>Social Computing, Behavioral-Cultural Modeling and Prediction</source>  
        <year>2011</year>  
        <publisher-loc>Berlin, Heidelberg</publisher-loc>
        <publisher-name>Springer-Verlag</publisher-name>
        <fpage>18</fpage>  
        <lpage>25</lpage> </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Huang</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Kornfield</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Szczypka</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Emery</surname>
            <given-names>SL</given-names>
          </name>
        </person-group>
        <article-title>A cross-sectional examination of marketing of electronic cigarettes on twitter</article-title>
        <source>Tob Control</source>  
        <year>2014</year>  
        <month>07</month>  
        <volume>23 Suppl 3</volume>  
        <fpage>iii26</fpage>  
        <lpage>30</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://tobaccocontrol.bmj.com/cgi/pmidlookup?view=long&#38;pmid=24935894"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1136/tobaccocontrol-2014-051551</pub-id>
        <pub-id pub-id-type="medline">24935894</pub-id>
        <pub-id pub-id-type="pii">tobaccocontrol-2014-051551</pub-id>
        <pub-id pub-id-type="pmcid">PMC4078681</pub-id></nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Jo</surname>
            <given-names>CL</given-names>
          </name>
          <name name-style="western">
            <surname>Kornfield</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Kim</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Emery</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Ribisl</surname>
            <given-names>KM</given-names>
          </name>
        </person-group>
        <article-title>Price-related promotions for tobacco products on twitter</article-title>
        <source>Tob Control</source>  
        <year>2016</year>  
        <month>07</month>  
        <volume>25</volume>  
        <issue>4</issue>  
        <fpage>476</fpage>  
        <lpage>9</lpage>  
        <pub-id pub-id-type="doi">10.1136/tobaccocontrol-2015-052260</pub-id>
        <pub-id pub-id-type="medline">26130449</pub-id>
        <pub-id pub-id-type="pii">tobaccocontrol-2015-052260</pub-id></nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>van den Heerik</surname>
            <given-names>RAM</given-names>
          </name>
          <name name-style="western">
            <surname>van Hooijdonk</surname>
            <given-names>CMJ</given-names>
          </name>
          <name name-style="western">
            <surname>Burgers</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Steen</surname>
            <given-names>GJ</given-names>
          </name>
        </person-group>
        <article-title>“Smoking Is Sóóó ... Sandals and White Socks”: Co-creation of a Dutch anti-smoking campaign to change social norms</article-title>
        <source>Health Commun</source>  
        <year>2016</year>  
        <month>06</month>  
        <day>29</day>  
        <fpage>1</fpage>  
        <lpage>8</lpage>  
        <pub-id pub-id-type="doi">10.1080/10410236.2016.1168000</pub-id>
        <pub-id pub-id-type="medline">27355838</pub-id></nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Step</surname>
            <given-names>MM</given-names>
          </name>
          <name name-style="western">
            <surname>Bracken</surname>
            <given-names>CC</given-names>
          </name>
          <name name-style="western">
            <surname>Trapl</surname>
            <given-names>ES</given-names>
          </name>
          <name name-style="western">
            <surname>Flocke</surname>
            <given-names>SA</given-names>
          </name>
        </person-group>
        <article-title>User and content characteristics of public tweets referencing little cigars</article-title>
        <source>Am J Health Behav</source>  
        <year>2016</year>  
        <month>01</month>  
        <volume>40</volume>  
        <issue>1</issue>  
        <fpage>38</fpage>  
        <lpage>47</lpage>  
        <pub-id pub-id-type="doi">10.5993/AJHB.40.1.5</pub-id>
        <pub-id pub-id-type="medline">26685812</pub-id></nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>de Viron</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Suggs</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Brand</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Van Oven</surname>
            <given-names>H</given-names>
          </name>
        </person-group>
        <article-title>Communicating genetics and smoking through social media: are we there yet?</article-title>
        <source>J Med Internet Res</source>  
        <year>2013</year>  
        <month>09</month>  
        <day>09</day>  
        <volume>15</volume>  
        <issue>9</issue>  
        <fpage>e198</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2013/9/e198/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/jmir.2653</pub-id>
        <pub-id pub-id-type="medline">24018012</pub-id>
        <pub-id pub-id-type="pii">v15i9e198</pub-id>
        <pub-id pub-id-type="pmcid">PMC3785980</pub-id></nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Prochaska</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Pechmann</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Kim</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Leonhardt</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>Twitter = quitter? an analysis of twitter quit smoking social networks</article-title>
        <source>Tobacco Control</source>  
        <year>2012</year>  
        <volume>21</volume>  
        <fpage>447</fpage>  
        <lpage>9</lpage>  
        <pub-id pub-id-type="doi">10.1007/978-3-642-19656-0</pub-id></nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Harris</surname>
            <given-names>JK</given-names>
          </name>
          <name name-style="western">
            <surname>Moreland-Russell</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Choucair</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Mansour</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Staub</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Simmons</surname>
            <given-names>K</given-names>
          </name>
        </person-group>
        <article-title>Tweeting for and against public health policy: response to the Chicago Department of Public Health's electronic cigarette twitter campaign</article-title>
        <source>J Med Internet Res</source>  
        <year>2014</year>  
        <volume>16</volume>  
        <issue>10</issue>  
        <fpage>e238</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2014/10/e238/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/jmir.3622</pub-id>
        <pub-id pub-id-type="medline">25320863</pub-id>
        <pub-id pub-id-type="pii">v16i10e238</pub-id>
        <pub-id pub-id-type="pmcid">PMC4210950</pub-id></nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Aphinyanaphongs</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Lulejian</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Brown</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Bonneau</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Krebs</surname>
            <given-names>P</given-names>
          </name>
        </person-group>
        <article-title>Text classificationfor automatic detection of e-cigarette use and use for smoking cessation from twitter: a feasibility pilot</article-title>
        <source>Pac Symp Biocomput</source>  
        <year>2016</year>  
        <volume>21</volume>  
        <fpage>480</fpage>  
        <lpage>91</lpage> </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Clark</surname>
            <given-names>EM</given-names>
          </name>
          <name name-style="western">
            <surname>Jones</surname>
            <given-names>CA</given-names>
          </name>
          <name name-style="western">
            <surname>Williams</surname>
            <given-names>JR</given-names>
          </name>
          <name name-style="western">
            <surname>Kurti</surname>
            <given-names>AN</given-names>
          </name>
          <name name-style="western">
            <surname>Norotsky</surname>
            <given-names>MC</given-names>
          </name>
          <name name-style="western">
            <surname>Danforth</surname>
            <given-names>CM</given-names>
          </name>
          <name name-style="western">
            <surname>Dodds</surname>
            <given-names>PS</given-names>
          </name>
        </person-group>
        <article-title>Vaporous marketing: uncovering pervasive electronic cigarette advertisements on twitter</article-title>
        <source>PLoS One</source>  
        <year>2016</year>  
        <month>7</month>  
        <volume>11</volume>  
        <issue>7</issue>  
        <fpage>e0157304</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0157304"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1371/journal.pone.0157304</pub-id>
        <pub-id pub-id-type="medline">27410031</pub-id>
        <pub-id pub-id-type="pii">PONE-D-15-39861</pub-id>
        <pub-id pub-id-type="pmcid">PMC4943591</pub-id></nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Kavuluru</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Sabbir</surname>
            <given-names>AK</given-names>
          </name>
        </person-group>
        <article-title>Toward automated e-cigarette surveillance: Spotting e-cigarette proponents on twitter</article-title>
        <source>J Biomed Inform</source>  
        <year>2016</year>  
        <month>06</month>  
        <volume>61</volume>  
        <fpage>19</fpage>  
        <lpage>26</lpage>  
        <pub-id pub-id-type="doi">10.1016/j.jbi.2016.03.006</pub-id>
        <pub-id pub-id-type="medline">26975599</pub-id>
        <pub-id pub-id-type="pii">S1532-0464(16)00046-0</pub-id>
        <pub-id pub-id-type="pmcid">PMC4893981</pub-id></nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Chu</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Unger</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Cruz</surname>
            <given-names>T</given-names>
          </name>
        </person-group>
        <article-title>Electronic cigarettes on twitter - spreading the appeal of flavors</article-title>
        <source>Tob Regul Sci</source>  
        <year>2015</year>  
        <volume>1</volume>  
        <fpage>36</fpage>  
        <lpage>41</lpage>  
        <pub-id pub-id-type="doi">10.18001/TRS.1.1.4</pub-id></nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Chung</surname>
            <given-names>JE</given-names>
          </name>
        </person-group>
        <article-title>A smoking cessation campaign on twitter: understanding the use of twitter and identifying major players in a health campaign</article-title>
        <source>J Health Commun</source>  
        <year>2016</year>  
        <month>05</month>  
        <volume>21</volume>  
        <issue>5</issue>  
        <fpage>517</fpage>  
        <lpage>26</lpage>  
        <pub-id pub-id-type="doi">10.1080/10810730.2015.1103332</pub-id>
        <pub-id pub-id-type="medline">27115179</pub-id></nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Cole-Lewis</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Varghese</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Sanders</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Schwarz</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Pugatch</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Augustson</surname>
            <given-names>E</given-names>
          </name>
        </person-group>
        <article-title>Assessing electronic cigarette-related tweets for sentiment and content using supervised machine learning</article-title>
        <source>J Med Internet Res</source>  
        <year>2015</year>  
        <month>08</month>  
        <day>25</day>  
        <volume>17</volume>  
        <issue>8</issue>  
        <fpage>e208</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2015/8/e208/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/jmir.4392</pub-id>
        <pub-id pub-id-type="medline">26307512</pub-id>
        <pub-id pub-id-type="pii">v17i8e208</pub-id>
        <pub-id pub-id-type="pmcid">PMC4642404</pub-id></nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Duke</surname>
            <given-names>JC</given-names>
          </name>
          <name name-style="western">
            <surname>Hansen</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Kim</surname>
            <given-names>AE</given-names>
          </name>
          <name name-style="western">
            <surname>Curry</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Allen</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>The use of social media by state tobacco control programs to promote smoking cessation: a cross-sectional study</article-title>
        <source>J Med Internet Res</source>  
        <year>2014</year>  
        <month>07</month>  
        <volume>16</volume>  
        <issue>7</issue>  
        <fpage>e169</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2014/7/e169/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/jmir.3430</pub-id>
        <pub-id pub-id-type="medline">25014311</pub-id>
        <pub-id pub-id-type="pii">v16i7e169</pub-id>
        <pub-id pub-id-type="pmcid">PMC4115651</pub-id></nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Emery</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Szcyzpka</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>ABril</surname>
            <given-names>E</given-names>
          </name>
        </person-group>
        <article-title>Are you scared yet? evaluating fear appeal messages in tweets about the tips campaign</article-title>
        <source>J Commun</source>  
        <year>2014</year>  
        <volume>64</volume>  
        <fpage>278</fpage>  
        <lpage>95</lpage>  
        <pub-id pub-id-type="doi">10.1111/jcom.12083</pub-id></nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>McDaniel</surname>
            <given-names>PA</given-names>
          </name>
          <name name-style="western">
            <surname>Patzke</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Malone</surname>
            <given-names>RE</given-names>
          </name>
        </person-group>
        <article-title>Twitter users' reaction to a chain pharmacy's decision to end tobacco sales</article-title>
        <source>Tob Induc Dis</source>  
        <year>2015</year>  
        <volume>13</volume>  
        <fpage>36</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://tobaccoinduceddiseases.biomedcentral.com/articles/10.1186/s12971-015-0060-9"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1186/s12971-015-0060-9</pub-id>
        <pub-id pub-id-type="medline">26539069</pub-id>
        <pub-id pub-id-type="pii">60</pub-id>
        <pub-id pub-id-type="pmcid">PMC4632371</pub-id></nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Rocheleau</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Sadasivam</surname>
            <given-names>RS</given-names>
          </name>
          <name name-style="western">
            <surname>Baquis</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Stahl</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Kinney</surname>
            <given-names>RL</given-names>
          </name>
          <name name-style="western">
            <surname>Pagoto</surname>
            <given-names>SL</given-names>
          </name>
          <name name-style="western">
            <surname>Houston</surname>
            <given-names>TK</given-names>
          </name>
        </person-group>
        <article-title>An observational study of social and emotional support in smoking cessation Twitter accounts: content analysis of tweets</article-title>
        <source>J Med Internet Res</source>  
        <year>2015</year>  
        <volume>17</volume>  
        <issue>1</issue>  
        <fpage>e18</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2015/1/e18/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/jmir.3768</pub-id>
        <pub-id pub-id-type="medline">25589009</pub-id>
        <pub-id pub-id-type="pii">v17i1e18</pub-id>
        <pub-id pub-id-type="pmcid">PMC4319088</pub-id></nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Unger</surname>
            <given-names>JB</given-names>
          </name>
          <name name-style="western">
            <surname>Escobedo</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Allem</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Soto</surname>
            <given-names>DW</given-names>
          </name>
          <name name-style="western">
            <surname>Chu</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Cruz</surname>
            <given-names>T</given-names>
          </name>
        </person-group>
        <article-title>Perceptions of secondhand e-cigarette aerosol among twitter users</article-title>
        <source>Tobacco Reg Sci</source>  
        <year>2016</year>  
        <month>04</month>  
        <day>01</day>  
        <volume>2</volume>  
        <issue>2</issue>  
        <fpage>146</fpage>  
        <lpage>52</lpage>  
        <pub-id pub-id-type="doi">10.18001/TRS.2.2.5</pub-id></nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Altman</surname>
            <given-names>D</given-names>
          </name>
        </person-group>
        <source>Practical statistics for medical research</source>  
        <year>1991</year>  
        <publisher-loc>London</publisher-loc>
        <publisher-name>Chapman and Hall</publisher-name></nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>George</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Mallery</surname>
            <given-names>P</given-names>
          </name>
        </person-group>
        <source>SPSS for Windows step by step: A simple guide and reference. 11.0 update. 4th edition</source>  
        <year>2003</year>  
        <publisher-loc>Boston, MA</publisher-loc>
        <publisher-name>Allyn &#38; Bacon</publisher-name></nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="web">
        <source>Centers for Disease Control and Prevention</source>  
        <year>2015</year>  
        <month>04</month>  
        <day>17</day>  
        <access-date>2016-11-18</access-date>
        <comment>Morbidity and Mortality Weekly Report: Tobacco use among middle and high school students: United States, 2011-2014 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.cdc.gov/mmwr/preview/mmwrhtml/mm6414a3.htm">http://www.cdc.gov/mmwr/preview/mmwrhtml/mm6414a3.htm</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6m7f7VXzc"/></comment> </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="web">
        <source>US Food and Drug Administration</source>  
        <year>2016</year>  
        <month>11</month>  
        <day>28</day>  
        <access-date>2017-03-13</access-date>
        <comment>The Facts on the FDA's New Tobacco Rule 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://www.fda.gov/ForConsumers/ConsumerUpdates/ucm506676.htm">https://www.fda.gov/ForConsumers/ConsumerUpdates/ucm506676.htm</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6owhqygQ1"/></comment> </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Reyes</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Rosso</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Veale</surname>
            <given-names>T</given-names>
          </name>
        </person-group>
        <article-title>A multidimensional approach for detecting irony in Twitter</article-title>
        <source>Lang Resources &#38; Evaluation</source>  
        <year>2012</year>  
        <month>7</month>  
        <day>24</day>  
        <volume>47</volume>  
        <issue>1</issue>  
        <fpage>239</fpage>  
        <lpage>68</lpage>  
        <pub-id pub-id-type="doi">10.1007/s10579-012-9196-x</pub-id></nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Sobhani</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Mohammad</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Kiritchenko</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <article-title>Detecting stance in tweets and analyzing its interaction with sentiment</article-title>
        <year>2016</year>  
        <conf-name>Proceedings of the Fifth Joint Conference on Lexical and Computational Semantics</conf-name>
        <conf-date>August 2016</conf-date>
        <conf-loc>Berlin, Germany</conf-loc>
        <fpage>159</fpage>  
        <lpage>169</lpage> </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Allem</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Ferrara</surname>
            <given-names>E</given-names>
          </name>
        </person-group>
        <article-title>The importance of debiasing social media data to better understand e-cigarette-related attitudes and behaviors</article-title>
        <source>J Med Internet Res</source>  
        <year>2016</year>  
        <month>08</month>  
        <day>09</day>  
        <volume>18</volume>  
        <issue>8</issue>  
        <fpage>e219</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2016/8/e219/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/jmir.6185</pub-id>
        <pub-id pub-id-type="medline">27507563</pub-id>
        <pub-id pub-id-type="pii">v18i8e219</pub-id>
        <pub-id pub-id-type="pmcid">PMC5037931</pub-id></nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Burger</surname>
            <given-names>JD</given-names>
          </name>
          <name name-style="western">
            <surname>Henderson</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Kim</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Zarrella</surname>
            <given-names>G</given-names>
          </name>
        </person-group>
        <article-title>Discriminating gender on Twitter</article-title>
        <year>2011</year>  
        <conf-name>Proceedings of the Conference on Empirical Methods in Natural Language Processing</conf-name>
        <conf-date>July 2011</conf-date>
        <conf-loc>Edinburgh, Scotland, UK</conf-loc></nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Sakaki</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Miura</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Ma</surname>
            <given-names>X</given-names>
          </name>
          <name name-style="western">
            <surname>Hattori</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Ohkuma</surname>
            <given-names>T</given-names>
          </name>
        </person-group>
        <article-title>Twitter user gender inferences using combined analysis of text and image processing</article-title>
        <year>2014</year>  
        <conf-name>Proceedings of the 25th International Conference on Computational Linguistics</conf-name>
        <conf-date>August 2014</conf-date>
        <conf-loc>Dublin, Ireland</conf-loc></nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Nguyen</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Gravel</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Trieschnigg</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Meder</surname>
            <given-names>T</given-names>
          </name>
        </person-group>
        <article-title>“How old do you think I am?”: a study of language and age in twitter</article-title>
        <year>2013</year>  
        <conf-name>Proceedings of the Seventh International AAAI Conference on WeblogsSocial Media</conf-name>
        <conf-date>July 2013</conf-date>
        <conf-loc>Cambridge, MA</conf-loc></nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
