<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
    <front>
        <journal-meta>
            <journal-id journal-id-type="publisher-id">JMIR</journal-id>
            <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
            <journal-title>Journal of Medical Internet Research</journal-title>
            <issn pub-type="epub">1438-8871</issn>
            <publisher>
                <publisher-name>JMIR Publications Inc.</publisher-name>
                <publisher-loc>Toronto, Canada</publisher-loc>
            </publisher>
        </journal-meta>
        <article-meta>
            <article-id pub-id-type="publisher-id">v17i6e138</article-id>
            <article-id pub-id-type="pmid">26048075</article-id>
            <article-id pub-id-type="doi">10.2196/jmir.4305</article-id>
            <article-categories>
                <subj-group subj-group-type="heading">
                    <subject>Original Paper</subject>
                </subj-group>
                <subj-group subj-group-type="article-type">
                    <subject>Original Paper</subject>
                </subj-group>
            </article-categories>
            <title-group>
                <article-title>A Scalable Framework to Detect Personal Health Mentions on Twitter</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="editor">
                    <name>
                        <surname>Eysenbach</surname>
                        <given-names>Gunther</given-names>
                    </name>
                </contrib>
            </contrib-group>
            <contrib-group>
                <contrib contrib-type="reviewer">
                    <name>
                        <surname>Bian</surname>
                        <given-names>Jian</given-names>
                    </name>
                </contrib>
                <contrib contrib-type="reviewer">
                    <name>
                        <surname>Nagar</surname>
                        <given-names>Ruchit</given-names>
                    </name>
                </contrib>
            </contrib-group>
            <contrib-group>
                <contrib contrib-type="author" id="contrib1" equal-contrib="yes">
                    <name name-style="western">
                        <surname>Yin</surname>
                        <given-names>Zhijun</given-names>
                    </name>
                    <xref rid="aff1" ref-type="aff">1</xref>
                    <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-3075-1337</ext-link>
                </contrib>
                <contrib contrib-type="author" id="contrib2">
                    <name name-style="western">
                        <surname>Fabbri</surname>
                        <given-names>Daniel</given-names>
                    </name>
                    <degrees>PhD</degrees>
                    <xref rid="aff1" ref-type="aff">1</xref>
                    <xref rid="aff2" ref-type="aff">2</xref>
                    <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-0530-2510</ext-link>
                </contrib>
                <contrib contrib-type="author" id="contrib3">
                    <name name-style="western">
                        <surname>Rosenbloom</surname>
                        <given-names>S Trent</given-names>
                    </name>
                    <degrees>MD, MPH</degrees>
                    <xref rid="aff2" ref-type="aff">2</xref>
                    <xref rid="aff3" ref-type="aff">3</xref>
                    <xref rid="aff4" ref-type="aff">4</xref>
                    <xref rid="aff5" ref-type="aff">5</xref>
                    <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-7455-2260</ext-link>
                </contrib>
                <contrib contrib-type="author" id="contrib4" corresp="yes">
                    <name name-style="western">
                        <surname>Malin</surname>
                        <given-names>Bradley</given-names>
                    </name>
                    <degrees>PhD</degrees>
                    <xref rid="aff1" ref-type="aff">1</xref>
                    <address>
                        <institution>Dept. of Electrical Engineering &#38; Computer Science</institution>
                        <institution>Vanderbilt University</institution>
                        <addr-line>Department of Biomedical Informatics, Vanderbilt University</addr-line>
                        <addr-line>2525 West End Avenue, Suite 1030</addr-line>
                        <addr-line>Nashville, TN, 37203</addr-line>
                        <country>United States</country>
                        <phone>1 615 343 9096</phone>
                        <fax>1 615 936 8545</fax>
                        <email>b.malin@vanderbilt.edu</email>
                    </address>
                    <xref rid="aff2" ref-type="aff">2</xref>
                    <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-3040-5175</ext-link>
                </contrib>
            </contrib-group>
            <aff id="aff1">
                <sup>1</sup>
                <institution>Dept. of Electrical Engineering &#38; Computer Science</institution>
                <institution>Vanderbilt University</institution>
                <addr-line>Nashville, TN</addr-line>
                <country>United States</country>
            </aff>
            <aff id="aff2">
                <sup>2</sup>
                <institution>Dept. of Biomedical Informatics</institution>
                <institution>Vanderbilt University</institution>
                <addr-line>Nashville, TN</addr-line>
                <country>United States</country>
            </aff>
            <aff id="aff3">
                <sup>3</sup>
                <institution>Dept. of Medicine</institution>
                <institution>Vanderbilt Univerisity</institution>
                <addr-line>Nashville, TN</addr-line>
                <country>United States</country>
            </aff>
            <aff id="aff4">
                <sup>4</sup>
                <institution>School of Nursing</institution>
                <institution>Vanderbilt University</institution>
                <addr-line>Nashville, TN</addr-line>
                <country>United States</country>
            </aff>
            <aff id="aff5">
                <sup>5</sup>
                <institution>Dept. of Pediatrics</institution>
                <institution>Vanderbilt University</institution>
                <addr-line>Nashville, TN</addr-line>
                <country>United States</country>
            </aff>
            <author-notes>
                <corresp>Corresponding Author: Bradley Malin <email>b.malin@vanderbilt.edu</email>
                </corresp>
            </author-notes>
            <pub-date pub-type="collection">
                <month>06</month>
                <year>2015</year>
            </pub-date>
            <pub-date pub-type="epub">
                <day>05</day>
                <month>06</month>
                <year>2015</year>
            </pub-date>
            <volume>17</volume>
            <issue>6</issue>
            <elocation-id>e138</elocation-id>
            <!--history from ojs - api-xml-->
            <history>
                <date date-type="received">
                    <day>31</day>
                    <month>01</month>
                    <year>2015</year>
                </date>
                <date date-type="rev-request">
                    <day>19</day>
                    <month>02</month>
                    <year>2015</year>
                </date>
                <date date-type="rev-recd">
                    <day>08</day>
                    <month>03</month>
                    <year>2015</year>
                </date>
                <date date-type="accepted">
                    <day>23</day>
                    <month>03</month>
                    <year>2015</year>
                </date>
            </history>
            <!--(c) the authors - correct author names and publication date here if necessary. Date in form ', dd.mm.yyyy' after jmir.org-->
            <copyright-statement>&#169;Zhijun Yin, Daniel Fabbri, S Trent Rosenbloom, Bradley Malin. Originally published in the Journal of Medical Internet Research (http://www.jmir.org), 05.06.2015. </copyright-statement>
            <copyright-year>2015</copyright-year>
            <license license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/2.0/">
                <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (http://creativecommons.org/licenses/by/2.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on http://www.jmir.org/, as well as this copyright and license information must be included.</p>
            </license>
            <self-uri xlink:href="http://www.jmir.org/2015/6/e138/" xlink:type="simple" />
            <abstract>
                <sec sec-type="background">
                    <title>Background</title>
                    <p>Biomedical research has traditionally been conducted via surveys and the analysis of medical records. However, these resources are limited in their content, such that non-traditional domains (eg, online forums and social media) have an opportunity to supplement the view of an individual&#8217;s health.</p>
                </sec>
                <sec sec-type="objective">
                    <title>Objective</title>
                    <p>The objective of this study was to develop a scalable framework to detect personal health status mentions on Twitter and assess the extent to which such information is disclosed.</p>
                </sec>
                <sec sec-type="methods">
                    <title>Methods</title>
                    <p>We collected more than 250 million tweets via the Twitter streaming API over a 2-month period in 2014. The corpus was filtered down to approximately 250,000 tweets, stratified across 34 high-impact health issues, based on guidance from the Medical Expenditure Panel Survey. We created a labeled corpus of several thousand tweets via a survey, administered over Amazon Mechanical Turk, that documents when terms correspond to mentions of personal health issues or an alternative (eg, a metaphor). We engineered a scalable classifier for personal health mentions via feature selection and assessed its potential over the health issues. We further investigated the utility of the tweets by determining the extent to which Twitter users disclose personal health status.</p>
                </sec>
                <sec sec-type="results">
                    <title>Results</title>
                    <p>Our investigation yielded several notable findings. First, we find that tweets from a small subset of the health issues can train a scalable classifier to detect health mentions. Specifically, training on 2000 tweets from four health issues (cancer, depression, hypertension, and leukemia) yielded a classifier with precision of 0.77 on all 34 health issues. Second, Twitter users disclosed personal health status for all health issues. Notably, personal health status was disclosed over 50% of the time for 11 out of 34 (33%) investigated health issues. Third, the disclosure rate was dependent on the health issue in a statistically significant manner (<italic>P</italic>&#60;.001). For instance, more than 80% of the tweets about migraines (83/100) and allergies (85/100) communicated personal health status, while only around 10% of the tweets about obesity (13/100) and heart attack (12/100) did so. Fourth, the likelihood that people disclose their own versus other people&#8217;s health status was dependent on health issue in a statistically significant manner as well (<italic>P</italic>&#60;.001). For example, 69% (69/100) of the insomnia tweets disclosed the author&#8217;s status, while only 1% (1/100) disclosed another person&#8217;s status. By contrast, 1% (1/100) of the Down syndrome tweets disclosed the author&#8217;s status, while 21% (21/100) disclosed another person&#8217;s status.</p>
                </sec>
                <sec sec-type="conclusions">
                    <title>Conclusions</title>
                    <p>It is possible to automatically detect personal health status mentions on Twitter in a scalable manner. These mentions correspond to the health issues of the Twitter users themselves, but also other individuals. Though this study did not investigate the veracity of such statements, we anticipate such information may be useful in supplementing traditional health-related sources for research purposes.</p>
                </sec>
            </abstract>
            <kwd-group>
                <kwd>consumer health</kwd>
                <kwd>information retrieval</kwd>
                <kwd>machine learning</kwd>
                <kwd>social media</kwd>
                <kwd>twitter</kwd>
                <kwd>infodemiology</kwd>
            </kwd-group>
        </article-meta>
    </front>
    <body>
        <sec sec-type="introduction">
            <title> Introduction</title>
            <sec>
                <title>Background</title>
                <p>Traditional methods for collecting data in support of clinical research include prospectively collected surveys (eg, [<xref ref-type="bibr" rid="ref1">1</xref>]), retrospective analyses of existing medical records (eg, [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref3">3</xref>]), and a combination of the two (eg, [<xref ref-type="bibr" rid="ref4">4</xref>]). Over the past decade, computerized methods for data collection have emerged, with traditional surveys for health research moving onto the Internet [<xref ref-type="bibr" rid="ref5">5</xref>] and increasingly widespread electronic medical records (EMRs) able to be mined to investigate a wide range of acute and longitudinal phenotypes [<xref ref-type="bibr" rid="ref6">6</xref>-<xref ref-type="bibr" rid="ref8">8</xref>]. At the same time, these approaches tend to focus only on a medically centric worldview, and may provide only a partial view of a patient&#8217;s life. Recognizing this limitation, investigators have suggested that the data contributed through non-traditional domains, such as mobile apps [<xref ref-type="bibr" rid="ref9">9</xref>-<xref ref-type="bibr" rid="ref11">11</xref>] and online forums where patients self-report on their status [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>], will provide a more complete view of an individual&#8217;s health and population-based health trends.</p>
                <p>An increasing number of studies demonstrate that the data disseminated via social media platforms, such as Twitter, can inform health-related investigations. We review such studies in the following section, but we highlight that studies have shown, for instance, that such data can be mined to model aggregate trends about health (eg, detection of statistically significant adverse effects of pharmaceuticals [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref15">15</xref>]). Recent investigations have also demonstrated that an individual&#8217;s health status can be corroborated by the statements they publish over social media platforms (eg, confirmation of flu diagnoses [<xref ref-type="bibr" rid="ref16">16</xref>]). Despite the power of such investigations, they are limited in that the associated approaches do not filter data from social media streams for any arbitrary health-related concept.</p>
            </sec>
            <sec>
                <title>Objective and Contribution</title>
                <p>The objective of our work is to develop a scalable framework for detecting mentions about personal health on a specific social media platform, namely Twitter. The system introduced in this paper is composed of several core processes. First, the system filters the Twitter stream for tweets that are likely to contain health-related information. Next, a subset of the tweets are labeled with respect to the type of information that is communicated (eg, health status of the author versus a metaphorical statement) and applied to train a classifier. While it is possible to label a large number of tweets given a substantial budget, it is unlikely that a classifier could be specialized for each specific health issue. For instance, imagine a researcher is interested in studying 10,000 distinct health issues, each of which will require at least 500 tweets to train a robust classifier. If the cost to label each tweet is $0.10, it would cost $500,000 to build the necessary corpora! Our framework demonstrates that a scalable classifier, which discovers health mentions across a broad range of health issues, can be composed by leveraging a mixture of tweets from various health issues, which could make large-scale investigations much more cost-effective. In doing so, however, our system is oriented toward a high precision while maintaining a reasonable recall.</p>
                <p>There are three primary contributions of this paper:</p>
                <list list-type="bullet">
                    <list-item>
                        <p>Labeled Health Mention Corpus. We leverage Amazon Mechanical Turk to create a labeled corpus of tweets with health mentions for 34 health issues. These include certain high impact health issues investigated in the Medical Expenditure Panel Survey [<xref ref-type="bibr" rid="ref17">17</xref>], such as arthritis, asthma, bronchitis, cancer, diabetes, hypertension, and stroke.</p>
                    </list-item>
                    <list-item>
                        <p>Health Mention Detection. We introduce a system to automatically detect personal health mentions in tweet streams. We show that this system is trainable with a relatively small number of labeled tweets from several health issues. Moreover, it can effectively detect personal health mentions across a range of health issues on Twitter. For instance, training on 2000 tweets associated with four health issues (cancer, depression, hypertension, and leukemia) can yield a classifier that achieves a precision of 0.77 on the aforementioned corpus of tweets of 34 health issues.</p>
                    </list-item>
                    <list-item>
                        <p>Health Mention Attribution. To demonstrate the potential for the data filtered from Twitter, we investigated how people reveal information about themselves and others. In doing so, we show that the likelihood an individual self-discloses is dependent on the health issues communicated. For example, personal health status is revealed more than 50% for 11 of the 34 health issues. For certain health issues (eg, allergies, bronchitis, insomnia, migraines, and ulcers), people are more likely to disclose their own health status, while for other health issues (eg, Alzheimer&#8217;s, Down syndrome, leukemia, miscarriage, and Parkinson&#8217;s), people are more likely to disclose another person&#8217;s status.</p>
                    </list-item>
                </list>
            </sec>
            <sec>
                <title>Prior Work</title>
                <sec>
                    <title>Social Media and Health Research</title>
                    <p>As alluded to, various investigations have demonstrated that social media can be successfully leveraged to (1) enable individuals to discuss their health status, (2) influence an individual&#8217;s health behavior, and (3) support the analysis of aggregate trends around health activities.</p>
                    <p>First, a certain portion of studies have focused on the extent to which, as well as how, social media enables self-reports of health information. Hale et al [<xref ref-type="bibr" rid="ref18">18</xref>] showed that users discuss their health conditions on public Facebook pages, but recognized that such pages tend to be overly general to attract users to contribute to a discussion. However, Bodnar and colleagues [<xref ref-type="bibr" rid="ref16">16</xref>] found that individuals who use social media discuss certain ailments with high accuracy on Twitter. Specifically, it was demonstrated that college students tend to talk about their influenza diagnosis and associated symptoms. More generally, Paul et al [<xref ref-type="bibr" rid="ref19">19</xref>] performed latent topic model discovery over self-reported health status in Twitter to detect complex and potentially novel phenotypes. It has further been shown, that some Twitter users reveal genome sequencing results (in relation to ancestry information according to 23andme.com services) over Twitter [<xref ref-type="bibr" rid="ref20">20</xref>].</p>
                    <p>Second, the previous investigations show that individuals publish information about themselves, but there is also a growing body of evidence to suggest that social media can influence an individual&#8217;s health behavior. In certain cases, exploitation of social media can bring about negative health behaviors. For instance, based on discussions about prescription abuse over Twitter, it was observed that social media may aggravate such problems [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref22">22</xref>]. In a similar vein, a content analysis of tweets, in association with the demographics of the followers of marijuana Twitter handles, showed that social media may allure young people to establish substance use patterns. Wilson et al also argued that social media enables more individuals to be involved in an anti-vaccination movement [<xref ref-type="bibr" rid="ref23">23</xref>]. However, it was also shown that social media can encourage more positive changes in health behavior. Notably, it was shown that increasing communications with smokers on social media can promote free cessation services [<xref ref-type="bibr" rid="ref24">24</xref>]. Moreover, Cobb and colleagues [<xref ref-type="bibr" rid="ref25">25</xref>] developed a Facebook application that was able to track the significant elements of an intervention on smoke cessation. It was also found that the design and realization of a community opinion leader model may mitigate the spread of HIV [<xref ref-type="bibr" rid="ref26">26</xref>].</p>
                    <p>Third, social media can be mined to learn and characterize aggregate trends with respect to health activities. For instance, it was shown that flu trends can be effectively extracted from Twitter using standard machine learning strategies [<xref ref-type="bibr" rid="ref27">27</xref>]. More specifically, the analysis of daily tweets across a major metropolitan region (eg, New York) can enable the prediction of which health issues are currently influencing the health of the public [<xref ref-type="bibr" rid="ref28">28</xref>]. Meanwhile, Nagel et al [<xref ref-type="bibr" rid="ref29">29</xref>] showed that both the keywords chosen to filter and create subgroups of tweets affected prediction accuracy. Beyond health status, it has been illustrated that the rare or unknown side-effects of drugs can be discovered through sentiment analysis over Twitter [<xref ref-type="bibr" rid="ref15">15</xref>].</p>
                    <p>Though social media can support a wide array of health-related investigations, there are a number of hurdles to making the associated methodologies scalable. As Curtis and colleagues [<xref ref-type="bibr" rid="ref30">30</xref>] point out, for instance, insufficient procedures for protecting participants&#8217; privacy was one of the challenges to recruiting members from social media to conduct HIV research. In addition, it was recently revealed that the unreliability of big data and continuous changes of search algorithms contributed to failures in the Google Flu Trends program [<xref ref-type="bibr" rid="ref31">31</xref>].</p>
                    <p>Our work differs from the aforementioned studies in that we focus on personal health status disclosure on Twitter. We note that Mao et al [<xref ref-type="bibr" rid="ref32">32</xref>] discussed a similar topic, but their work is limited in that (1) it relied on regular expressions for classification, (2) focused on a limited number of health issues, and (3) examined whether personal health status is disclosed on status or conversation, but did not differentiate when heath status was disclosed for authors versus others. Lamb et al [<xref ref-type="bibr" rid="ref33">33</xref>] showed that a combination of tweets about infection with respect to both authors and others performed better than tweets about the authors alone when predicting flu trends, which lends credibility to our work. However, it should be noted that their classification only focused on a diagnosis of the flu instead of a broad range of health issues, as is addressed in our work.</p>
                </sec>
                <sec>
                    <title>Classification on Social Media</title>
                    <p>To mine health-related information from social media, it is critical to develop a classifier. However, tweets are constrained in size and, thus, are composed of limited content. Consequentially, it is essential to define and select discriminative features to support automated health status detection. In certain studies, tweets were enriched with features by referencing external sources, such as Wikipedia [<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref35">35</xref>], to improve topic modeling, but their generality hampers them in the support of personal health mention detection.</p>
                    <p>As an alternative, it has been shown that punctuation, emoji characters, hashtags, and the @username designation, as well as text (including n-grams of words or characters [<xref ref-type="bibr" rid="ref36">36</xref>]) from the webpage referenced by the URL in a tweet, can form meaningful features for classification purposes [<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref38">38</xref>]. Features generated using natural language processing tools, such as part of speech tags and dependencies between terms were also successfully incorporated as features in social media classifiers [<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref39">39</xref>]. Building on previous studies, our work illustrates that nouns, verbs, pronouns, punctuation, emoji, hashtags, as well as dependencies, can serve as effective features for personal health mention.</p>
                </sec>
                <sec>
                    <title>Social Media Corpus Construction</title>
                    <p>If we rely on a classifier to filter and analyze social media, then it is essential to obtain (or create) a labeled corpus to train the classifier. Crowdsourcing over Web-based platforms, such as Amazon Mechanical Turk (MT), has been employed to generate labeled gold standard corpora [<xref ref-type="bibr" rid="ref37">37</xref>]. Notably, MT was leveraged to label when tweets were related to the health status of the author of a tweet in the latent topic modeling analysis discussed above [<xref ref-type="bibr" rid="ref19">19</xref>]. However, it should be recognized that the survey utilized by [<xref ref-type="bibr" rid="ref19">19</xref>] is limited in that it only related tweet content to the author and not another person&#8217;s health status.</p>
                </sec>
            </sec>
            <sec>
                <title>The Personal Health Status Mention Problem</title>
                <p>To formalize the problem, we define the notions of personal health status and mention: Definition 1 (Personal Health Status) is the health condition of a specific person regarding a health issue or symptom, and Definition 2 (Personal Health Mention) is a statement of personal health status in social media.</p>
                <p>These definitions focus on the health information of the individuals who are potentially identifiable. For instance, tweets such as &#8220;my father is cancer free for ten years&#8221;, &#8220;I have to do chemo tomorrow&#8221;, and &#8220;my little cousin has leukemia&#8221; are representatives of personal health mentions. By contrast, &#8220;Local charity doing great work to help cancer patients&#8221; is not a personal health mention because the subject is a group of people as opposed to a specific person.</p>
                <p>We treat the problem of personal health mention detection as binary classification. We say a tweet is positive if it reveals personal health status and negative otherwise. For example, two MT masters assigned positive labels to each of the first three tweets in <xref ref-type="table" rid="table1">Table 1</xref> (details in Method Section). Yet a term associated with a health issue can be uttered on Twitter for many other reasons, such as in a metaphorical sense, to express a viewpoint about a health issue in general, or to communicate a worry. The next three tweets in <xref ref-type="table" rid="table1">Table 1</xref> provide examples of these reasons respectively.</p>
                <p>Given their brevity (140 characters at most), tweets often have limited context. Consequentially, assigning a class label to a tweet is substantially more challenging than detecting if a given tweet communicates status of the author. The last three tweets in <xref ref-type="table" rid="table1">Table 1</xref> illustrates this observation, where MT masters assigned different option labels to the same tweet.</p>
                <p>In this paper, we study how people disclose personal health statuses on Twitter and present a scalable personal health mentions detection system for the Twitter stream. Specifically, we decompose this investigation into the following four hypotheses: H1: People discuss personal health status on Twitter; H2: Personal health status disclosure rate is health issue dependent; H3: The likelihood that people disclose their own versus other people&#8217;s personal health status is health issue dependent; and H4: Personal health status mention classifiers based on tweets of multiple health issues are more scalable than those based on a single health issue.</p>
                <table-wrap position="float" id="table1">
                    <label>Table 1</label>
                    <caption>
                        <p>Examples of tweets related to health issues and the labels obtained through the Mechanical Turk (MT) survey.</p>
                    </caption>
                    <table width="687" border="1" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                        <col width="40" />
                        <col width="462" />
                        <col width="64" />
                        <col width="63" />
                        <thead>
                            <tr valign="top">
                                <td rowspan="2" colspan="2">Tweet</td>
                                <td colspan="2">Label via MT</td>
                            </tr>
                            <tr valign="top">
                                <td>Master 1</td>
                                <td>Master 2</td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td colspan="4">
                                    <bold>Positive</bold>
                                </td>
                            </tr>
                            <tr valign="top">
                                <td>
                                    <break />
                                </td>
                                <td>I&#8217;m suffering from schizophrenia and a little bit of insomnia.</td>
                                <td>author</td>
                                <td>author</td>
                            </tr>
                            <tr valign="top">
                                <td>
                                    <break />
                                </td>
                                <td>Prayers for my dad would be appreciated. He has lymphoma. Thanks for the support everyone.</td>
                                <td>relative</td>
                                <td>relative</td>
                            </tr>
                            <tr valign="top">
                                <td>
                                    <break />
                                </td>
                                <td>didn&#8217;t she have a miscarriage like 3 days ago?</td>
                                <td>someone else</td>
                                <td>someone else</td>
                            </tr>
                            <tr valign="top">
                                <td colspan="4">
                                    <bold>Negative</bold>
                                </td>
                            </tr>
                            <tr valign="top">
                                <td>
                                    <break />
                                </td>
                                <td>you&#8217;re gonna give Viv a heart attack</td>
                                <td>metaphor</td>
                                <td>metaphor</td>
                            </tr>
                            <tr valign="top">
                                <td>
                                    <break />
                                </td>
                                <td>Even after Bill Gates relentless support and millions of dollars poured into Malaria research, we are not successful.</td>
                                <td>viewpoint</td>
                                <td>viewpoint</td>
                            </tr>
                            <tr valign="top">
                                <td>
                                    <break />
                                </td>
                                <td>Praying I don&#8217;t have pneumonia</td>
                                <td>worry</td>
                                <td>worry</td>
                            </tr>
                            <tr valign="top">
                                <td colspan="4">
                                    <bold>Ambiguous</bold>
                                </td>
                            </tr>
                            <tr valign="top">
                                <td>
                                    <break />
                                </td>
                                <td>Cheerios say she&#8217;ll never have to worry about dieting. Too bad with 2:1 sodium to cal, she&#8217;ll have to worry about high blood pressure.</td>
                                <td>metaphor</td>
                                <td>someone else</td>
                            </tr>
                            <tr valign="top">
                                <td>
                                    <break />
                                </td>
                                <td>Yooo soo i walk out my apt and here this girl screaming for help. Apparently, she kneed her testicular cancer bf in the nuts repeatedly.</td>
                                <td>metaphor</td>
                                <td>someone else</td>
                            </tr>
                            <tr valign="top">
                                <td>
                                    <break />
                                </td>
                                <td>memorial find. 10% of your bills went to leukemia and lymphoma research. when amber was around she brightened everyone&#8217;s day in one way.</td>
                                <td>viewpoint</td>
                                <td>someone else</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
            </sec>
        </sec>
        <sec sec-type="methods">
            <title>Methods</title>
            <sec>
                <title>System Pipeline</title>
                <p>
                    <xref ref-type="fig" rid="figure1">Figure 1</xref> provides a high-level summary of the system engineered to detect personal health mentions on Twitter. The system is composed of three primary components: (1) a filtering service (eg, a keyword filter based on health issues), (2) a labeling service, and (3) a health mention classification service. First, tweets collected via the Twitter streaming API are passed into a filter and stored in a bin indicative of a specific health issue. Next, a sample of the tweets associated with these health issues are sent to a labeling service (eg, MT). Once labeling is complete, a personal health mention classifier is trained and applied to report the probability that new incoming tweets correspond to such mentions.</p>
                <fig id="figure1" position="float">
                    <label>Figure 1</label>
                    <caption>
                        <p>Framework for personal health mention detection over Twitter. First, tweets are filtered into bins according to health issue topic. A portion of the tweets are supplied to a labeling service. The labeled data is then applied to train a classifier to detect personal health mentions.</p>
                    </caption>
                    <graphic xlink:href="jmir_v17i6e138_fig1.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
            </sec>
            <sec>
                <title>Construction of a Health Mention Corpus</title>
                <p>To create a labeled corpus of health status mentions, we solicited annotators through MT. Specifically, we set up a survey for labeling a corpus on MT, the details of which are in <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>. For each tweet, we directed two MT masters to select the best of seven options that describe how the tweet uses the health issue. These options represent the common usage of most health issues. We validated the reliability of the MT masters by illustrating that they exhibit high concordance in their labels (details in Tables A-2, A-3 in <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>, and in <xref ref-type="app" rid="app2">Multimedia Appendix 2</xref>). <xref ref-type="fig" rid="figure2">Figure 2</xref> depicts how the options relate to the positive and negative labels.</p>
                <p>The positive class includes the labels of author, relative or friend, and someone else. The negative class consists of labels for metaphor, viewpoint, and worry. <xref ref-type="table" rid="table1">Table 1</xref> provides examples of tweets and the labels supplied by the MT masters. The last option label, N/A, which means none of the above, is also treated as a negative label in this investigation because it was observed (by the authors) that such labels were generally negative. For instance, these include tweets with job related information, which is spam that has nothing to do with a personal health mention.</p>
                <p>For the purposes of this study, we created four types of datasets. The formalization of the design of these datasets is available in Table B-1 in <xref ref-type="app" rid="app3">Multimedia Appendix 3</xref>. We refer to the first as the gold standard dataset. It consists of all tweets with labels agreeing at the positive (negative) level. This dataset represents an ideal case where readers can determine when a tweet communicates personal health status. For example, this dataset treats tweets as positive when labeled as author by one MT master and someone else by a second MT master. By contrast, this dataset discards tweets labeled as relative or friend and worry.</p>
                <p>Given the difficulty in labeling tweets in practice, we generated three additional datasets to resolve label conflicts. The first is the conflict as positive (CAP) dataset, which treats tweets with conflicting labels as positive. The second is the conflict as negative (CAN) dataset, which treats tweets with conflicting labels as negative. The third is the TieBreak dataset, which uses a third MT master to break the tie. These datasets represent the best case, the worst case, and the general case in the real world and we rely upon them to assess the system&#8217;s scalability.</p>
                <fig id="figure2" position="float">
                    <label>Figure 2</label>
                    <caption>
                        <p>Label hierarchy.</p>
                    </caption>
                    <graphic xlink:href="jmir_v17i6e138_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
            </sec>
            <sec>
                <title>System Classifier Evaluation Roadmap</title>
                <p>System scalability emphasizes the ability to detect mentions for many, potentially unknown, health issues communicated via social media, using the labeled tweets from a limited number of health issues.</p>
                <p>To formalize the scenario, let <italic>D</italic> be the set of health issues and <italic>X</italic> and <italic>Y</italic> be the set of health issues selected to train and test the classifier, respectively. By default, <italic>X, Y</italic> &#8838; <italic>D</italic>.</p>
                <p>As depicted in <xref ref-type="fig" rid="figure3">Figure 3</xref>, we assess two variations on classification. The first, which we refer to as homogeneous classification, corresponds to the traditional machine learning setting where a classifier is trained and tested on tweets from the same health issue. The second, which we refer to as heterogeneous classification, corresponds to when we train and test the classifier on tweets from disparate health issues. This type of scenario arises when a researcher attempts to reuse a classifier developed for one health issue on a different problem. <xref ref-type="fig" rid="figure3">Figure 3</xref> further illustrates two training strategies to scale the system in a real-world scenario: train the classifier on tweets from (1) one health issue, which results in homogeneous classification with &#124;<italic>X</italic>&#124; = 1 (HOC-1) and heterogeneous classification with &#124;<italic>X</italic>&#124; = 1 (HEC-1), and (2) many health issues, which results in homogeneous classification with &#124;<italic>X</italic>&#124; &#62; 1 (HOC-N) and heterogeneous classification with &#124;<italic>X</italic>&#124; &#62; 1 (HEC-N).</p>
                <p>The ideal scalability test is to train an HOC-1 classifier for every health issue in <italic>D</italic> with a sufficient quantity of labeled tweets. However, it is difficult to realize this scenario in practice because of limited budgets for gathering and annotating such corpora. As such, we performed a series of experiments to compare the performance of the various models (ie, HOC-1, HOC-N, HEC-1, and HEC-N) and leverage the best model to conduct scalability tests in a real-world scenario.</p>
                <fig id="figure3" position="float">
                    <label>Figure 3</label>
                    <caption>
                        <p>Overview of evaluation strategies for the personal health status mention classifier. Note, D={d1, d2, …, dn} is set of health issues, X is set of health issues selected to train classifier, and Y is set of health issues used to test classifier.</p>
                    </caption>
                    <graphic xlink:href="jmir_v17i6e138_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
            </sec>
            <sec>
                <title>Performance Measures</title>
                <p>To assess the performance of the system, we rely upon the standard measures of precision and recall. In our setting, precision (P) corresponds to the proportion of tweets classified as positive that are in fact positive. Recall (R)corresponds to the fraction of real positive tweets that are classified as positive. Given the large volume of tweets and the often unbalanced positive/negative class ratio per health issue (see <xref ref-type="table" rid="table2">Table 2</xref> and <xref ref-type="fig" rid="figure4">Figure 4</xref>), we emphasize P while setting R to a reasonable level. Henceforth, we report the area under the PR curve (AUPRC) to evaluate how a classifier performs in general. We consider the PR curve, which can be more indicative of a classifier&#8217;s performance when the class ratio is highly imbalanced [<xref ref-type="bibr" rid="ref40">40</xref>]. To characterize general performance, we report on AUPRC when testing the scalability of the system.</p>
                <fig id="figure4" position="float">
                    <label>Figure 4</label>
                    <caption>
                        <p>The extent to which people tweet about themselves versus others when disclosing personal health status. Note that this is a stacked bar chart, such that the sum of the author and others proportions corresponds to the overall proportion of positive instances.</p>
                    </caption>
                    <graphic xlink:href="jmir_v17i6e138_fig4.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
            </sec>
            <sec>
                <title>Health Status Classifier</title>
                <p>One of the aims in this research is to examine whether we can use classifiers trained with tweets from multiple health issues to detect personal health mentions about other health issues. Hence, it should be noted that the goal of our research is to examine the effectiveness of classifiers when supplied with a set of known (or off-the-shelf) features. We use a Multinomial Na&#239;ve Bayes (MNB) binary classifier based on four types of features associated with tweets. Alternatively, we can plug other learning algorithms, such as logistic regression or a support vector machine, into the framework as the base classifier. Previous investigations verified the effectiveness of such features [<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref37">37</xref>-<xref ref-type="bibr" rid="ref39">39</xref>].</p>
                <list list-type="bullet">
                    <list-item>
                        <p>Nouns, verbs, and pronouns. We transformed each word into its lemma form. Though pronouns are often defined as stop terms (which are discarded in traditional natural language processing), they are retained because they can disclose the personal health status of a friend or family member (eg, &#8220;My mom makes having cancer look good&#8221;).</p>
                    </list-item>
                    <list-item>
                        <p>Dependencies. These are grammatical relations [<xref ref-type="bibr" rid="ref41">41</xref>] between words in a tweet, such that one of the words is a health issue. We replaced terms for health issues with the keyword diagnosis to compact the feature space. For example, the dependency (&#8220;dobj&#8221;, &#8220;have&#8221;, &#8220;cancer&#8221;) is converted into a feature that can be supplied to MNB, dobj_have_diagnosis.</p>
                    </list-item>
                    <list-item>
                        <p>Punctuation and Emoji. These can indicate an author&#8217;s emotion and may improve classification (e.g., &#8220;my uncle is cancer free !!!!!! lol&#8221;).</p>
                    </list-item>
                    <list-item>
                        <p>HTTP LINK, #hashtags, and @username. These features represent the existence of link, hashtag, and @username in a tweet, respectively.</p>
                    </list-item>
                </list>
            </sec>
            <sec>
                <title>Experiment Design</title>
                <sec>
                    <title>Overview</title>
                    <p>In our experiments, we highlight the evaluation of two important factors that can affect the scalability of a classifier: (1) the diversity of health issues in the training data, and (2) the quantity of training tweets. When we compare different classifiers, we focus on the former. When we test system scalability, beside the system scalability, we also evaluate the performance of the classifiers with different size of training dataset. The following provides details of the experiment design.</p>
                </sec>
                <sec>
                    <title>Dataset</title>
                    <p>We use the 34 health issues depicted in <xref ref-type="fig" rid="figure4">Figure 4</xref> to represent D and define a synthetic health issue, or SYND, as the union of cancer, depression, hypertension, and leukemia. We select cancer and leukemia, for which tweets are skewed toward communicating about other people&#8217;s health status, and depression and hypertension, for which tweets are skewed toward communicating about the author&#8217;s health status. We first applied the keywords (shown in Table D-1 in <xref ref-type="app" rid="app4">Multimedia Appendix 4</xref>), which were selected based on these health issues under the guidance of a clinical expert, to filter for tweets associated with the keywords. Then, we chose 1000 tweets, at random, for each of the four health issues to obtain the gold standard datasets. We also choose 100 tweets, at random, for each of health issue in D to generate gold standard, CAN, CAP and TieBreak datasets.</p>
                </sec>
                <sec>
                    <title>Comparison Between HOC-1 and HOC-N</title>
                    <p>We use the cancer, depression, hypertension, and leukemia gold standard datasets to train each homogeneous classifier. There are two situations where we can evaluate how the diversity of health issues in the training data influence the homogeneous classifiers. First, suppose that we aim to detect multiple health issues. Given a fixed number of training tweets, how does an HOC-N classifier (eg, trained with SYND) differ from a group of HOC-1 classifiers (eg, four HOC-1 classifiers)? Second, now imagine we wish to perform detection for only one single health issue (eg, cancer). Given a fixed number of training tweets, how does a HOC-N classifier (eg, trained with SYND and test on cancer) differ from the associated HOC-1 classifier (eg, cancer HOC-1 classifier)?</p>
                </sec>
                <sec>
                    <title>Comparison Between HEC-1 and HEC-N</title>
                    <p>To evaluate the diversity of health issues in training dataset, we compare HEC-1 with HEC-N (2 &#8804; &#124;<italic>X</italic>&#124; &#8804; 4). In particular, we use the cancer, depression, hypertension and leukemia gold standard datasets for training and the gold standard dataset of D  SYND to test all of the heterogeneous classifiers.</p>
                </sec>
                <sec>
                    <title>System Scalability Test</title>
                    <p>When assessing system scalability, we test the classifier on the CAN, CAP, and TieBreak datasets of D. This enables the evaluation of the performance of the system in a real-world scenario. We also test the classifier trained with different number of tweets.</p>
                </sec>
                <sec>
                    <title>Experimental Methodology</title>
                    <p>For each experiment, we stratify the tweets and generate 30 train-test sets. In doing so, (1) each set preserves the proportion of samples for each positive (negative) class, and (2) the data is partitioned, such that we train on 80% of the tweets while we test on the remaining 20%. To control the comparison, the size of the training set for each compared classifier is equivalent.</p>
                </sec>
            </sec>
        </sec>
        <sec sec-type="results">
            <title>Results</title>
            <sec>
                <title>Dataset</title>
                <p>We used the Twitter streaming API to filter for tweets between May 7, 2014 and July 23, 2014 that were (1) published in the contiguous United States according to their geolocation, and (2) written in the English language only. A total of 261,468,446 tweets were subject to a filter composed of keywords for 34 health issues, resulting in 281,357 tweets (0.11%) for further investigation.</p>
            </sec>
            <sec>
                <title>How People Disclose Personal Health Status on Twitter</title>
                <p>To demonstrate the opportunities for a personal health mention detection system, we conducted an investigation to test H1, H2, and H3. We chose 100 tweets, at random, for each of the 34 health issues as shown along the x-axis of <xref ref-type="fig" rid="figure4">Figure 4</xref>, to generate the TieBreak dataset. These health issues are based on common and high impact health issues as defined by the Medical Expenditure Panel Survey [<xref ref-type="bibr" rid="ref17">17</xref>]. This figure illustrates how often people disclose their own health status as opposed to other individuals&#8217; status. The black bar, &#8220;About Author&#8221;, represents the proportion of positive tweets with the author label. The gray bar, &#8220;About Others&#8221;, represents the proportion of positive tweets with the label relative or friends and someone else. For a specific health issue, the sum of the two values is equal to the proportion of positive tweets for this health issue. For example, 40% of the tweets about miscarriages (40/100) disclosed other people&#8217;s status, while only 12% (12/100) disclosed the author&#8217;s status (such that 52%, 52/100, of the tweets were positive instances).</p>
                <p>To test hypothesis H2 (personal health status disclosure rate) and H3 (who the disclosure is about), we define the following null hypotheses: H2<sub>o</sub>: The rate of positive and negative tweets is independent of the health issues, and H3<sub>o</sub>: The rate of tweets disclosing the author&#8217;s health status and others&#8217; health status is independent of the health issues.</p>
                <p>To test these hypotheses, we used the TieBreak dataset, which (due to randomness) represents 100 samples from each of the 34 distributions regarding how people disclose health status. To test H2, we applied a chi-square test on these two variables: the number of positive tweets and the number of negative tweets in each health issue samples. To test hypothesis H3, we applied a Spearman correlation test on these two variables: the rate of tweets disclosing the author&#8217;s health status and the rate of tweets disclosing the others&#8217; health status. We set the alpha level of significance to .05.</p>
                <p>The results reveal several notable pieces of evidence, which are related to the first three hypotheses posed above.</p>
                <list list-type="bullet">
                    <list-item>
                        <p>People disclose personal health status on Twitter for a range of health issues (H1). The disclosure rate for each of the 34 health issues is greater than 9%. There are 29 health issues with disclosure rates greater than 20% and 11 health issues with disclosure rates greater than 50%. The latter group includes: allergies (85/100), anemia (57/100), arthritis (48/100), asthma (61/100), bronchitis (88/100), insomnia (70/100), kidney stones (67/100), migraines (83/100), miscarriages (52/100), pneumonia (68/100), thyroid (74/100) problems, and ulcers (56/100).</p>
                    </list-item>
                    <list-item>
                        <p>Health status disclosure rate is dependent on the health issue, &#967;<sup>2</sup>
                            <sub>33</sub>=697, <italic>P</italic>&#60;.001. For instance, more than 80% of the tweets about migraines (83/100) and allergies (85/100) communicate personal health status. By contrast, only &#8764;10% of tweets about obesity (13/100) and heart attacks (12/100) communicate personal health status. Bronchitis (88/100) exhibits the largest proportion of tweets that disclose personal health status, while smallpox (9/100) exhibits the smallest proportion.</p>
                    </list-item>
                    <list-item>
                        <p>The likelihood that people disclose their own versus other people&#8217;s health status is dependent on the health issue, <italic>Z</italic>=&#8722;5.745, <italic>P</italic>&#60;.001. For instance, 69% (69/100) of tweets about insomnia disclose the author&#8217;s personal health statuses compared, while only 1% (1/100) disclose another person&#8217;s status. By contrast, 1% (1/100) of the tweets for Down syndrome disclose the author&#8217;s status, while 21% (21/100) disclose another person&#8217;s status.</p>
                    </list-item>
                </list>
            </sec>
            <sec>
                <title>Classification Evaluation</title>
                <sec>
                    <title>Classification Data Set</title>
                    <p>We extracted the gold standard datasets for each of the four health issues mentioned in the Methods section. <xref ref-type="table" rid="table2">Table 2</xref> summarizes the number of tweets in each class. Except leukemia, which has a balanced positive and negative instance space, there were substantially more negative than positive tweets. Due to the definition of SYND, the number of positive and negative tweets of the synthetic health issue is the sum of the four health issues.</p>
                    <table-wrap position="float" id="table2">
                        <label>Table 2</label>
                        <caption>
                            <p>The number of positive and negative tweets in the gold standard datasets.</p>
                        </caption>
                        <table width="673" border="1" cellpadding="8" cellspacing="0" rules="groups" frame="hsides">
                            <col width="138" />
                            <col width="117" />
                            <col width="112" />
                            <col width="108" />
                            <col width="102" />
                            <col width="93" />
                            <thead>
                                <tr valign="bottom">
                                    <td>Tweet</td>
                                    <td>Cancer</td>
                                    <td>Depression</td>
                                    <td>Hypertension</td>
                                    <td>Leukemia</td>
                                    <td>SYND<sup>a</sup>
                                    </td>
                                </tr>
                            </thead>
                            <tbody>
                                <tr valign="top">
                                    <td>Positive</td>
                                    <td>166</td>
                                    <td>261</td>
                                    <td>211</td>
                                    <td>436</td>
                                    <td>1074</td>
                                </tr>
                                <tr valign="top">
                                    <td>Negative</td>
                                    <td>697</td>
                                    <td>461</td>
                                    <td>551</td>
                                    <td>423</td>
                                    <td>2132</td>
                                </tr>
                            </tbody>
                        </table>
                        <table-wrap-foot>
                            <fn id="table2fn1">
                                <p>
                                    <sup>a</sup>SYND: synthetic health issue (D).</p>
                            </fn>
                        </table-wrap-foot>
                    </table-wrap>
                </sec>
                <sec>
                    <title>Most Informative Features</title>
                    <p>Before conducting an in-depth empirical investigation, we inspected the classifiers and their corresponding features to determine if they are intuitive. Here, we report on the top 10 informative features by training in a homogeneous classification setting with tweets of each of the five health issues (cancer, depression, hypertension, leukemia, and SYND). <xref ref-type="table" rid="table3">Table 3</xref> reports these features for each classifier.</p>
                    <p>The results show the effectiveness of feature selection in several ways. First, more than five features are pronouns, such as I, my, and she (which was also confirmed in [<xref ref-type="bibr" rid="ref32">32</xref>]). These are stop words that are typically removed in the context of general text classification. However, in our scenario, they appear to signify users who disclose health information about themselves and others (eg, &#8220;my mom makes having cancer look easy&#8221;). Second, certain words, such as get, have, and battle, when applied in conjunction with a health issue, can disclose personal health status (eg, &#8220;my friend lost his battle to leukemia&#8221;). Third, dependencies, such as &#8220;obj_have_diagnosis&#8221;, are strong positive indicators (eg, &#8220;I have seasonal allergy&#8221;).</p>
                    <p>This table also provides several notable results about other behaviors when people disclose personal health status. For instance, people often include @someone in health mentions. They use links to provide additional information such as pictures, locations, or texts, or use exclamation mark to express strong feelings about personal health status.</p>
                    <p>The hypertension classifier was notable because it had specific health-related terminology ranked highly. Specifically, the term blood is highly informative for this classifier. We suspect this is because hypertension is commonly referred as high blood pressure.</p>
                    <table-wrap position="float" id="table3">
                        <label>Table 3</label>
                        <caption>
                            <p>The most informative features for homogeneous health mention classification.</p>
                        </caption>
                        <table width="673" border="1" cellpadding="8" cellspacing="0" rules="groups" frame="hsides">
                            <col width="42" />
                            <col width="136" />
                            <col width="129" />
                            <col width="143" />
                            <col width="86" />
                            <col width="135" />
                            <thead>
                                <tr valign="bottom">
                                    <td>Rank</td>
                                    <td>Cancer</td>
                                    <td>Depression</td>
                                    <td>Hypertension</td>
                                    <td>Leukemia</td>
                                    <td>SYND<sup>a</sup>
                                    </td>
                                </tr>
                            </thead>
                            <tbody>
                                <tr valign="top">
                                    <td>1</td>
                                    <td>I</td>
                                    <td>I</td>
                                    <td>I</td>
                                    <td>I</td>
                                    <td>I</td>
                                </tr>
                                <tr valign="top">
                                    <td>2</td>
                                    <td>my</td>
                                    <td>my</td>
                                    <td>my</td>
                                    <td>My</td>
                                    <td>My</td>
                                </tr>
                                <tr valign="top">
                                    <td>3</td>
                                    <td>!</td>
                                    <td />
                                    <td>have</td>
                                    <td />
                                    <td />
                                </tr>
                                <tr valign="top">
                                    <td>4</td>
                                    <td />
                                    <td>you</td>
                                    <td />
                                    <td>HTTP LINK</td>
                                    <td>!</td>
                                </tr>
                                <tr valign="top">
                                    <td>5</td>
                                    <td>you</td>
                                    <td>it</td>
                                    <td>dobj_have_diagnosis</td>
                                    <td>!</td>
                                    <td>Have</td>
                                </tr>
                                <tr valign="top">
                                    <td>6</td>
                                    <td>have</td>
                                    <td>go</td>
                                    <td>!</td>
                                    <td>She</td>
                                    <td>HTTP LINK</td>
                                </tr>
                                <tr valign="top">
                                    <td>7</td>
                                    <td>she</td>
                                    <td>poss_diagnosis_my</td>
                                    <td>get</td>
                                    <td>Have</td>
                                    <td>She</td>
                                </tr>
                                <tr valign="top">
                                    <td>8</td>
                                    <td>He</td>
                                    <td>!</td>
                                    <td>she</td>
                                    <td>He</td>
                                    <td>You</td>
                                </tr>
                                <tr valign="top">
                                    <td>9</td>
                                    <td>HTTP LINK</td>
                                    <td>get</td>
                                    <td>it</td>
                                    <td>Battle</td>
                                    <td>obj&#173;_have_diagnosis</td>
                                </tr>
                                <tr valign="top">
                                    <td>10</td>
                                    <td>obj_have_diagnosis</td>
                                    <td>have</td>
                                    <td>blood</td>
                                    <td>Help</td>
                                    <td>He</td>
                                </tr>
                            </tbody>
                        </table>
                        <table-wrap-foot>
                            <fn id="table3fn1">
                                <p>
                                    <sup>a</sup>SYND: synthetic health issue (D).</p>
                            </fn>
                        </table-wrap-foot>
                    </table-wrap>
                </sec>
                <sec>
                    <title>Homogeneous and Heterogeneous Classification</title>
                    <p>In this experiment, we compared the effectiveness of homogeneous and heterogeneous classifiers and then testing on tweets from each of the five health issues. <xref ref-type="table" rid="table4">Table 4</xref> provides the AUPRCs for each homogeneous (along the diagonal) and heterogeneous (off diagonal cells) health mention classifier. Each row corresponds to the health issue relied upon for training the classifier, while each column corresponds to the health issue the classifier was applied to. To test the significance, we ran a <italic>t</italic> test when the results followed a normal distribution and a Kolmogorov-Smirnov (KS) test otherwise.</p>
                    <p>First, it should be noted that each homogeneous classifier outperforms the heterogeneous classifiers when testing the corresponding health issue tweets, but such classifiers do not generalize. It can be seen that the leukemia HOC-1 classifier achieved the highest AUPRC. This may be due to the balance in the positive and negative classes for this health issue. However, it was observed that the homogeneous classifiers exhibited much higher variance compared to the heterogeneous classifiers. This suggests that heterogeneous classifiers may yield stable results.</p>
                    <p>Second, the HEC-1 classifier may tend to obtain a better AUPRC when testing on health issues with a similar author-to-others disclosure rate. For instance, cancer achieved the best AUPRC when testing on leukemia tweets. Meanwhile, leukemia achieved the best AUPRC when testing on cancer tweets. Depression and hypertension also achieved the best AUPRC when testing on each other.</p>
                    <p>Third, it also shows that SYND heterogeneous classifier (HEC-N) was the second best heterogeneous classifier when testing on cancer, depression, and leukemia tweets, and the best heterogeneous classifier when testing on hypertension. Considering that the HEC-1 classifier is specialized to a certain health issue, the HEC-N classifier may provide a more scalable alternative when filtering for personal health mentions on other health issues.</p>
                    <table-wrap position="float" id="table4">
                        <label>Table 4</label>
                        <caption>
                            <p>AUPRC for homogeneous and heterogeneous classifiers.<sup>a</sup>
                            </p>
                        </caption>
                        <table width="673" border="1" cellpadding="8" cellspacing="0" rules="groups" frame="hsides">
                            <col width="99" />
                            <col width="115" />
                            <col width="119" />
                            <col width="122" />
                            <col width="104" />
                            <col width="113" />
                            <thead>
                                <tr valign="top">
                                    <td rowspan="2">
                                        <break />
                                    </td>
                                    <td>Cancer</td>
                                    <td>Depression</td>
                                    <td>Hypertension</td>
                                    <td>Leukemia</td>
                                    <td>SYND</td>
                                </tr>
                                <tr valign="top">
                                    <td colspan="5">mean (SD)</td>
                                </tr>
                            </thead>
                            <tbody>
                                <tr valign="bottom">
                                    <td>Cancer</td>
                                    <td>0.732 (0.058)</td>
                                    <td>0.528 (0.018) <sup>b</sup>
                                    </td>
                                    <td>0.552 (0.014)<sup>b</sup>
                                    </td>
                                    <td>0.869 (0.009)<sup>b</sup>
                                    </td>
                                    <td>0.728 (0.009)<sup>b</sup>
                                    </td>
                                </tr>
                                <tr valign="bottom">
                                    <td>Depression</td>
                                    <td>0.441 (0.007)<sup>b</sup>
                                    </td>
                                    <td>0.663 (0.054)</td>
                                    <td>0.611 (0.014)<sup>b</sup>
                                    </td>
                                    <td>0.821 (0.006)<sup>b</sup>
                                    </td>
                                    <td>0.666 (0.006)<sup>b</sup>
                                    </td>
                                </tr>
                                <tr valign="bottom">
                                    <td>Hypertension</td>
                                    <td>0.451 (0.009)<sup>b</sup>
                                    </td>
                                    <td>0.646 (0.011)</td>
                                    <td>0.664 (0.062)</td>
                                    <td>0.726 (0.008)<sup>b</sup>
                                    </td>
                                    <td>0.616 (0.006)<sup>b</sup>
                                    </td>
                                </tr>
                                <tr valign="bottom">
                                    <td>Leukemia</td>
                                    <td>0.638 (0.011)<sup>b</sup>
                                    </td>
                                    <td>0.603 (0.011)<sup>b</sup>
                                    </td>
                                    <td>0.559 (0.019)<sup>e</sup>
                                    </td>
                                    <td>0.936 (0.019)</td>
                                    <td>0.579 (0.007)<sup>b</sup>
                                    </td>
                                </tr>
                                <tr valign="bottom">
                                    <td>SYND<sup>f</sup>
                                    </td>
                                    <td>0.625 (0.022)<sup>e</sup>
                                    </td>
                                    <td>0.618 (0.026)<sup>d</sup>
                                    </td>
                                    <td>0.626 (0.019)<sup>c</sup>
                                    </td>
                                    <td>0.831 (0.023)<sup>b</sup>
                                    </td>
                                    <td>0.820 (0.0180</td>
                                </tr>
                            </tbody>
                        </table>
                        <table-wrap-foot>
                            <fn id="table4fn1">
                                <p>
                                    <sup>a</sup> AUPRC: area under the precision recall curve. Classifiers were trained with row health issue tweets and tested on column health issue tweets. Within each column, a hypothesis test was conducted between HOC-1 and each model that is not HOC-1 (eg, HOC-1 vs HEC-1).</p>
                            </fn>
                            <fn id="table4fn2">
                                <p>
                                    <sup>b</sup>
                                    <italic>P</italic>&#60;.001</p>
                            </fn>
                            <fn id="table4fn3">
                                <p>
                                    <sup>c</sup>
                                    <italic>P</italic>=.002</p>
                            </fn>
                            <fn id="table4fn4">
                                <p>
                                    <sup>d</sup>
                                    <italic>P</italic>=.003</p>
                            </fn>
                            <fn id="table4fn5">
                                <p>
                                    <sup>e</sup>
                                    <italic>P</italic>=.004</p>
                            </fn>
                            <fn id="table4fn6">
                                <p>
                                    <sup>f</sup>SYND: synthetic health issue (D).</p>
                            </fn>
                        </table-wrap-foot>
                    </table-wrap>
                    <table-wrap position="float" id="table5">
                        <label>Table 5</label>
                        <caption>
                            <p>AUPRC of homogeneous health mention classifiers, given the same number of training tweets.<sup>a</sup>
                            </p>
                        </caption>
                        <table width="673" border="1" cellpadding="8" cellspacing="0" rules="groups" frame="hsides">
                            <col width="101" />
                            <col width="142" />
                            <col width="142" />
                            <col width="142" />
                            <col width="142" />
                            <thead>
                                <tr valign="top">
                                    <td rowspan="2">Classifier</td>
                                    <td>Cancer</td>
                                    <td>Depression</td>
                                    <td>Hypertension</td>
                                    <td>Leukemia</td>
                                </tr>
                                <tr valign="top">
                                    <td colspan="4">mean (SD)</td>
                                </tr>
                            </thead>
                            <tbody>
                                <tr valign="bottom">
                                    <td>HOC-1<sup>b</sup>
                                    </td>
                                    <td>0.732 (0.058)</td>
                                    <td>0.663 (0.054)</td>
                                    <td>0.664 (0.063)</td>
                                    <td>0.936 (0.019)</td>
                                </tr>
                                <tr valign="bottom">
                                    <td>HOC-N<sup>c</sup>
                                    </td>
                                    <td>0.723 (0.061)</td>
                                    <td>0.645 (0.053)</td>
                                    <td>0.672 (0.070)</td>
                                    <td>0.927 (0.022)</td>
                                </tr>
                                <tr valign="bottom">
                                    <td>HOC-N&#8225;</td>
                                    <td>0.756 (0.050)</td>
                                    <td>0.681 (0.050)</td>
                                    <td>0.702 (0.059)<sup>d</sup>
                                    </td>
                                    <td>0.940 (0.021)</td>
                                </tr>
                            </tbody>
                        </table>
                        <table-wrap-foot>
                            <fn id="table5fn1">
                                <p>
                                    <sup>a</sup>AUPRC: area under the precision recall curve. Within each column, the hypothesis test was conducted between HOC-1 and each model that is not HOC-1 (eg, HOC-1 vs HOC-N).</p>
                            </fn>
                            <fn id="table5fn2">
                                <p>
                                    <sup>b</sup>HOC-1: homogeneous classification with &#124;X&#124; = 1</p>
                            </fn>
                            <fn id="table5fn3">
                                <p>
                                    <sup>c</sup>HOC-N: homogeneous classification with &#124;X&#124; &#62; 1</p>
                            </fn>
                            <fn id="table5fn4">
                                <p>
                                    <sup>d</sup>
                                    <italic>P</italic>=.015</p>
                            </fn>
                        </table-wrap-foot>
                    </table-wrap>
                </sec>
                <sec>
                    <title>Comparison of Homogeneous Classifiers</title>
                    <p>In this experiment, we evaluated how homogeneous classifiers are influenced by (1) the number of health issues in the training set, and (2) the number of tweets used for training classifiers. <xref ref-type="table" rid="table5">Table 5</xref> shows the results for the HOC-1 and HOC-N classifiers when testing on the tweets of each health issue. For each column, we trained homogeneous classifiers HOC-1 and HOC-N with the same number of training tweets. The number of training tweets for HOC-N<sup>&#8225;</sup> classifier equaled to the number of all the tweets training for each HOC-1 classifier. HOC-N<sup>&#8225;</sup> is introduced to compare classifiers in a scenario often encountered in practice. For instance, imagine there is a fixed budget (eg, monetary quantity) through which we can only label 2000 tweets. If we have four HOC-1 classifiers, then we can only allocate 500 tweets to each. However, we can allocate all 2000 tweets to the HOC-N classifier. Again, we ran a <italic>t</italic> test when the results failed to followed a normal distribution and a KS-test otherwise.</p>
                    <p>The hypothesis tests showed that only the HOC-1 and HOC-N<sup>&#8225;</sup> classifiers are statistically significant when testing on hypertension tweets (<italic>P</italic>=.015). This suggests that HOC-N classifiers are expected to have similar performance with HOC-1 classifiers when each classifier is trained with the same number of training tweets. However, if the total number of training tweets is fixed, the HOC-N classifier will outperform the combination of HOC-1 classifiers.</p>
                    <p>This indicates that the HOC-N classifier can serve as a substitute for HOC-1 classifiers.</p>
                </sec>
                <sec>
                    <title>Comparison Between Heterogeneous Classifiers</title>
                    <p>In this experiment, we evaluated how the number of health issues in the training set influence the heterogeneous classifiers. <xref ref-type="fig" rid="figure5">Figure 5</xref> shows the results of HEC-1 and HEC-N (N &#8712; {2, 3, 4}) when testing on the other 30 health issues. For HEC-1, it should be noted that the cancer HEC-1 achieved the best AUPRC. This may stem from the fact that cancer can be invoked to communicate a wide variety of concepts beyond an individual&#8217;s health status, such as the Zodiac, the name of a physical building, or a metaphor. The results also indicate that HEC-N tends to outperform HEC-1.</p>
                    <p>This suggests hypothesis H4 may be true, provided the classifier is based on an appropriate mixture of health issues. However, determining an optimized group of health issues to achieve an HEC-N classifier with performance comparable to HEC-1 classifier is left to future investigation.</p>
                    <p>Based on these findings, we use HOC-N and HEC-N to conduct the system scalability test.</p>
                    <fig id="figure5" position="float">
                        <label>Figure 5</label>
                        <caption>
                            <p>Comparison Between heterogeneous classifiers HEC-1 and HEC-N trained on cancer, depression, hypertension, and leukemia, and tested on the remaining 30 health issues. The tweets of each test health issue stratified with respect to their rate of observation.</p>
                        </caption>
                        <graphic xlink:href="jmir_v17i6e138_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                    </fig>
                </sec>
            </sec>
            <sec>
                <title>System Scalability</title>
                <p>After breaking ties, 43.7% of the TieBreak dataset are positive instances. Based on this proportion, there are approximately 120,260 positive instances out of 281,357 tweets in the health issue bins (or 0.046% of all the collected tweets). <xref ref-type="table" rid="table6">Table 6</xref> reports the distribution of positive and negative tweets in each dataset.</p>
                <p>We trained the SYND classifier with the gold standard datasets for cancer, depression, hypertension, and leukemia, and tested it on the other three types of datasets. <xref ref-type="fig" rid="figure6">Figure 6</xref> depicts the PR curves for each dataset and shows the average and standard deviation of AUPRC. The upper line corresponds to testing on the CAP dataset (AUPRC 0.753, SD 0.005), the middle line corresponds to testing on the TieBreak dataset (AUPRC 0.685, SD 0.005) and the lower line corresponds to testing on the CAP dataset (AUPRC 0.594, SD 0.007). When fixing the recall to 0.4, it was observed that the CAP, TieBreak, and CAN scenarios yield a precision of 0.8, 0.77, and 0.61, respectively. These results demonstrate the scalability of the system classifiers to obtain a high precision with a reasonable recall when testing many other health issues in the Twitter environment.</p>
                <p>
                    <xref ref-type="fig" rid="figure7">Figure 7</xref> shows how the size of the training set influences the AUPRC of the classifiers. For each training set, the mean AUPRC and a 95% confidence interval is illustrated in the gray area. For each dataset, the results suggest that AUPRC achieves stability when the training set consists of approximately 2000 tweets.</p>
                <table-wrap position="float" id="table6">
                    <label>Table 6</label>
                    <caption>
                        <p>Class distribution of tweets in the datasets.</p>
                    </caption>
                    <table width="673" border="1" cellpadding="8" cellspacing="0" rules="groups" frame="hsides">
                        <col width="164" />
                        <col width="111" />
                        <col width="129" />
                        <col width="120" />
                        <col width="147" />
                        <thead>
                            <tr valign="bottom">
                                <td>Tweets</td>
                                <td>Gold</td>
                                <td>CAN<sup>a</sup>
                                </td>
                                <td>CAP<sup>b</sup>
                                </td>
                                <td>TieBreak</td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td>Positives</td>
                                <td>1082</td>
                                <td>1082</td>
                                <td>1718</td>
                                <td>1366</td>
                            </tr>
                            <tr valign="top">
                                <td>Negatives</td>
                                <td>1539</td>
                                <td>2175</td>
                                <td>1539</td>
                                <td>1891</td>
                            </tr>
                        </tbody>
                    </table>
                    <table-wrap-foot>
                        <fn id="table6fn1">
                            <p>
                                <sup>a</sup>CAN: conflict as negative</p>
                        </fn>
                        <fn id="table6fn2">
                            <p>
                                <sup>b</sup>CAP: conflict as positive</p>
                        </fn>
                    </table-wrap-foot>
                </table-wrap>
                <fig id="figure6" position="float">
                    <label>Figure 6</label>
                    <caption>
                        <p>PR (precision recall) curves for testing on the gold, CAN (conflict as negative), and CAP (conflict as positive) datasets.</p>
                    </caption>
                    <graphic xlink:href="jmir_v17i6e138_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
                <fig id="figure7" position="float">
                    <label>Figure 7</label>
                    <caption>
                        <p>Performance of the SYND (synthetic health issue) classifier with a varying amount of training data.</p>
                    </caption>
                    <graphic xlink:href="jmir_v17i6e138_fig7.png" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
            </sec>
        </sec>
        <sec sec-type="discussion">
            <title>Discussion</title>
            <sec>
                <title>Principal Findings</title>
                <p>There are several notable findings from this investigation. First, Twitter users disclose the health status of themselves and others. Second, the health status disclosure rate may depend on the health issue. Third, how people disclose their own and other people&#8217;s health status may also be health issue dependent. Fourth, tweets related with a small group of health issues can train a scalable classifier to detect health mentions on Twitter streams.</p>
                <p>Another interesting phenomenon illustrated from the PR curves (<xref ref-type="fig" rid="figure6">Figure 6</xref>) is that the system classifier, trained with the tweets for which MT masters exhibited high concordance in their labels, is more likely than MT masters to classify tweets with conflict labels as positive. One possible explanation is that the classifier makes its decision based on thousands of examples, while most MT masters made decisions only with the description of the survey, which indicates that the classifier may be more familiar with the labeling task. This suggests there may be a difference between using an expert and crowdsourcing to generate the labeled corpus. However, determining how to best leverage the crowd to mimic an expert is beyond the scope of this investigation.</p>
            </sec>
            <sec>
                <title>Impact on Health Related Research</title>
                <p>According to our investigation, roughly 44% of the tweets containing health issue keywords disclose personal health status. We believe there is a potential for information to assist health care professionals in learning about their patients or their patients&#8217; family medical history, information often missing in the EMRs. This indicates that social media platforms, such as Twitter contains huge amount of personal health care related information that may complement traditional EMRs in research and practice. We recognized that we must still verify the veracity of such data, but an opportunity exists nonetheless.</p>
            </sec>
            <sec>
                <title>Limitations</title>
                <p>We wish to highlight several limitations of this investigation. First, two parameters to extract tweets from Twitter streams require configuration: (1) the set of keywords invoked in the filter, and (2) the geolocation applied to discover tweets. Compared to keywords, geolocation can filter tweets disseminated by authoritative organizations (due to the absence of &#8220;coordinates&#8221; and &#8220;place&#8221; information in these tweets), such as the American Cancer Society, and thus greatly reduce noise. However, it should be noted that invoking such a filter can also exclude the tweets of individuals who choose not to disclose their location. A second limitation exists in the survey provided to the MT masters for labeling the corpus. Specifically, we assumed the N/A option was a member of the negative class, but this could be an incorrect assumption in certain instances. Third, this investigation was restricted to only 34 health-related phenomena, which is clearly only a sample of all possible health issues. The keywords filter service can be enhanced by integrating a laymen health vocabulary [<xref ref-type="bibr" rid="ref42">42</xref>]. Given that this study shows there is (1) high variability in the rate at which people tweet about a certain health issue, and (2) to whom the statement of health issue corresponds, it will be critical to investigate how these methods fare in the context of other health issues.</p>
            </sec>
            <sec>
                <title>Conclusions</title>
                <p>Recent studies demonstrate the information communicated through social media platforms, such as Twitter and Facebook, could supplement traditional medical and epidemiological research. In this paper, we showed that a health mention detection system can be designed and deployed for microblogging systems, such as Twitter. At the same time, we illustrated that the information communicated through such mentions can disclose the health status of the authors and other individuals at a wide range of rates. Our experimental investigation further showed that the combination of tweets from several health issues can yield a classifier that dominates a classifier based on the tweets of a single health issue. This may enable the system to use a small amount of training data to build a classifier that detects health status mentions across a range of health issues. We envision several opportunities for extending this work. First, we believe the scalability of the classifier may be improved by determining the minimal set of health issues and features (eg, more complicated grammar features). Second, we anticipate that the performance of the classifier could be improved be accounting for context, such as dialogue, relationships in the network, and profile information as new supplemental features. Finally, while the rate that health status is disclosed for the author versus other individuals is dependent upon the considered health issue, further investigation is required to determine what drives this disparity. We suspect, for instance, that it may be dependent on the sensitivity and severity of health issues, but this is only a conjecture.</p>
            </sec>
        </sec>
    </body>
    <back>
        <app-group>
            <app id="app1">
                <title>Multimedia Appendix 1</title>
                <p>Example question posed to Mechanical Turk masters.</p>
                <media xlink:href="jmir_v17i6e138_app1.pdf" xlink:title="PDF File (Adobe PDF File), 239KB" />
            </app>
            <app id="app2">
                <title>Multimedia Appendix 2</title>
                <p>Concordance between the system classifier and Mechanical Turk masters.</p>
                <media xlink:href="jmir_v17i6e138_app2.pdf" xlink:title="PDF File (Adobe PDF File), 464KB" />
            </app>
            <app id="app3">
                <title>Multimedia Appendix 3</title>
                <p>Summary of four datasets.</p>
                <media xlink:href="jmir_v17i6e138_app3.pdf" xlink:title="PDF File (Adobe PDF File), 221KB" />
            </app>
            <app id="app4">
                <title>Multimedia Appendix 4</title>
                <p>Keywords used to filter tweets.</p>
                <media xlink:href="jmir_v17i6e138_app4.pdf" xlink:title="PDF File (Adobe PDF File), 216KB" />
            </app>
        </app-group>
        <glossary>
            <title>Abbreviations</title>
            <def-list>
                <def-item>
                    <term id="abb1">AUPRC</term>
                    <def>
                        <p>area under the precision recall curve</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb2">CAP</term>
                    <def>
                        <p>conflict as positive</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb3">CAN</term>
                    <def>
                        <p>conflict as negative</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb4">EMR</term>
                    <def>
                        <p>electronic medical record</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb5">HEC-1</term>
                    <def>
                        <p>heterogeneous classification with &#124;X&#124; = 1</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb6">HEC-N</term>
                    <def>
                        <p>heterogeneous classification with &#124;X&#124; &#62; 1</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb7">HOC-1</term>
                    <def>
                        <p>homogeneous classification with &#124;X&#124; = 1</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb8">HOC-N</term>
                    <def>
                        <p>homogeneous classification with &#124;X&#124; &#62; 1</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb9">KS</term>
                    <def>
                        <p>Kolmogorov-Smirnov Test</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb10">MNB</term>
                    <def>
                        <p>Multinomial Na&#239;ve Bayes</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb11">MT</term>
                    <def>
                        <p>Mechanical Turk</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb12">N/A</term>
                    <def>
                        <p>none of the above</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb13">SYND</term>
                    <def>
                        <p>synthetic health issue</p>
                    </def>
                </def-item>
            </def-list>
        </glossary>
        <ack>
            <p>This research was sponsored in part by grants from the National Science Foundation (CCF-0424422) and the Patient Centered Outcomes Research Institute (CDRN-1306-04869). The authors would like to thank the members of the Mid-South Clinical Data Research Network for useful discussions during the development of this research.</p>
        </ack>
        <fn-group>
            <fn fn-type="conflict">
                <p>None declared.</p>
            </fn>
        </fn-group>
        <ref-list>
            <ref id="ref1">
                <label>1</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Garratt</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ruta</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Abdalla</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Buckingham</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Russell</surname>
                            <given-names>I</given-names>
                        </name>
                    </person-group>
                    <article-title>The SF36 health survey questionnaire: an outcome measure suitable for routine use within the NHS?</article-title>
                    <source>BMJ</source>
                    <year>1993</year>
                    <month>05</month>
                    <day>29</day>
                    <volume>306</volume>
                    <issue>6890</issue>
                    <fpage>1440</fpage>
                    <lpage>4</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/8518640" />
                    </comment>
                    <pub-id pub-id-type="medline">8518640</pub-id>
                    <pub-id pub-id-type="pmcid">PMC1677883</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref2">
                <label>2</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Samsa</surname>
                            <given-names>G P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Matchar</surname>
                            <given-names>D B</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Goldstein</surname>
                            <given-names>L B</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Bonito</surname>
                            <given-names>A J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lux</surname>
                            <given-names>L J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Witter</surname>
                            <given-names>D M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Bian</surname>
                            <given-names>J</given-names>
                        </name>
                    </person-group>
                    <article-title>Quality of anticoagulation management among patients with atrial fibrillation: results of a review of medical records from 2 communities</article-title>
                    <source>Arch Intern Med</source>
                    <year>2000</year>
                    <month>04</month>
                    <day>10</day>
                    <volume>160</volume>
                    <issue>7</issue>
                    <fpage>967</fpage>
                    <lpage>73</lpage>
                    <pub-id pub-id-type="medline">10761962</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref3">
                <label>3</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Williams</surname>
                            <given-names>L S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Yilmaz</surname>
                            <given-names>E Y</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lopez-Yunez</surname>
                            <given-names>A M</given-names>
                        </name>
                    </person-group>
                    <article-title>Retrospective assessment of initial stroke severity with the NIH Stroke Scale</article-title>
                    <source>Stroke</source>
                    <year>2000</year>
                    <month>04</month>
                    <volume>31</volume>
                    <issue>4</issue>
                    <fpage>858</fpage>
                    <lpage>62</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://stroke.ahajournals.org/cgi/pmidlookup?view=long&#38;pmid=10753988" />
                    </comment>
                    <pub-id pub-id-type="medline">10753988</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref4">
                <label>4</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Quam</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ellis</surname>
                            <given-names>L B</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Venus</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Clouse</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Taylor</surname>
                            <given-names>C G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Leatherman</surname>
                            <given-names>S</given-names>
                        </name>
                    </person-group>
                    <article-title>Using claims data for epidemiologic research. The concordance of claims-based criteria with the medical record and patient survey for identifying a hypertensive population</article-title>
                    <source>Med Care</source>
                    <year>1993</year>
                    <month>06</month>
                    <volume>31</volume>
                    <issue>6</issue>
                    <fpage>498</fpage>
                    <lpage>507</lpage>
                    <pub-id pub-id-type="medline">8501997</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref5">
                <label>5</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Eysenbach</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Wyatt</surname>
                            <given-names>J</given-names>
                        </name>
                    </person-group>
                    <article-title>Using the Internet for surveys and health research</article-title>
                    <source>J Med Internet Res</source>
                    <year>2002</year>
                    <volume>4</volume>
                    <issue>2</issue>
                    <fpage>E13</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2002/2/e13/" />
                    </comment>
                    <pub-id pub-id-type="doi">10.2196/jmir.4.2.e13</pub-id>
                    <pub-id pub-id-type="medline">12554560</pub-id>
                    <pub-id pub-id-type="pmcid">PMC1761932</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref6">
                <label>6</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Coorevits</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sundgren</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Klein</surname>
                            <given-names>G O</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Bahr</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Claerhout</surname>
                            <given-names>B</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Daniel</surname>
                            <given-names>C</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Dugas</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Dupont</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Schmidt</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Singleton</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>De Moor</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kalra</surname>
                            <given-names>D</given-names>
                        </name>
                    </person-group>
                    <article-title>Electronic health records: new opportunities for clinical research</article-title>
                    <source>J Intern Med</source>
                    <year>2013</year>
                    <month>12</month>
                    <volume>274</volume>
                    <issue>6</issue>
                    <fpage>547</fpage>
                    <lpage>60</lpage>
                    <pub-id pub-id-type="doi">10.1111/joim.12119</pub-id>
                    <pub-id pub-id-type="medline">23952476</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref7">
                <label>7</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Jensen</surname>
                            <given-names>Peter B</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Jensen</surname>
                            <given-names>Lars J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Brunak</surname>
                            <given-names>Søren</given-names>
                        </name>
                    </person-group>
                    <article-title>Mining electronic health records: towards better research applications and clinical care</article-title>
                    <source>Nat Rev Genet</source>
                    <year>2012</year>
                    <month>06</month>
                    <volume>13</volume>
                    <issue>6</issue>
                    <fpage>395</fpage>
                    <lpage>405</lpage>
                    <pub-id pub-id-type="doi">10.1038/nrg3208</pub-id>
                    <pub-id pub-id-type="medline">22549152</pub-id>
                    <pub-id pub-id-type="pii">nrg3208</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref8">
                <label>8</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Rea</surname>
                            <given-names>Susan</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Pathak</surname>
                            <given-names>Jyotishman</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Savova</surname>
                            <given-names>Guergana</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Oniki</surname>
                            <given-names>Thomas A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Westberg</surname>
                            <given-names>Les</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Beebe</surname>
                            <given-names>Calvin E</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Tao</surname>
                            <given-names>Cui</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Parker</surname>
                            <given-names>Craig G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Haug</surname>
                            <given-names>Peter J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Huff</surname>
                            <given-names>Stanley M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Chute</surname>
                            <given-names>Christopher G</given-names>
                        </name>
                    </person-group>
                    <article-title>Building a robust, scalable and standards-driven infrastructure for secondary use of EHR data: the SHARPn project</article-title>
                    <source>J Biomed Inform</source>
                    <year>2012</year>
                    <month>08</month>
                    <volume>45</volume>
                    <issue>4</issue>
                    <fpage>763</fpage>
                    <lpage>71</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://linkinghub.elsevier.com/retrieve/pii/S1532-0464(12)00020-2" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1016/j.jbi.2012.01.009</pub-id>
                    <pub-id pub-id-type="medline">22326800</pub-id>
                    <pub-id pub-id-type="pii">S1532-0464(12)00020-2</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref9">
                <label>9</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Estrin</surname>
                            <given-names>D</given-names>
                        </name>
                    </person-group>
                    <article-title>Small data, where n=me</article-title>
                    <source>Commun ACM</source>
                    <year>2014</year>
                    <month>04</month>
                    <day>01</day>
                    <volume>57</volume>
                    <issue>4</issue>
                    <fpage>32</fpage>
                    <lpage>34</lpage>
                    <pub-id pub-id-type="doi">10.1145/2580944</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref10">
                <label>10</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Kumar</surname>
                            <given-names>Santosh</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Nilsen</surname>
                            <given-names>Wendy J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Abernethy</surname>
                            <given-names>Amy</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Atienza</surname>
                            <given-names>Audie</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Patrick</surname>
                            <given-names>Kevin</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Pavel</surname>
                            <given-names>Misha</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Riley</surname>
                            <given-names>William T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Shar</surname>
                            <given-names>Albert</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Spring</surname>
                            <given-names>Bonnie</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Spruijt-Metz</surname>
                            <given-names>Donna</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hedeker</surname>
                            <given-names>Donald</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Honavar</surname>
                            <given-names>Vasant</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kravitz</surname>
                            <given-names>Richard</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lefebvre</surname>
                            <given-names>R Craig</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Mohr</surname>
                            <given-names>David C</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Murphy</surname>
                            <given-names>Susan A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Quinn</surname>
                            <given-names>Charlene</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Shusterman</surname>
                            <given-names>Vladimir</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Swendeman</surname>
                            <given-names>Dallas</given-names>
                        </name>
                    </person-group>
                    <article-title>Mobile health technology evaluation: the mHealth evidence workshop</article-title>
                    <source>Am J Prev Med</source>
                    <year>2013</year>
                    <month>08</month>
                    <volume>45</volume>
                    <issue>2</issue>
                    <fpage>228</fpage>
                    <lpage>36</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/23867031" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1016/j.amepre.2013.03.017</pub-id>
                    <pub-id pub-id-type="medline">23867031</pub-id>
                    <pub-id pub-id-type="pii">S0749-3797(13)00277-8</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3803146</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref11">
                <label>11</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Tomlinson</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Rotheram-Borus</surname>
                            <given-names>MJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Swartz</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Tsai</surname>
                            <given-names>A</given-names>
                        </name>
                    </person-group>
                    <article-title>Scaling up mHealth: where is the evidence?</article-title>
                    <source>PLoS Med</source>
                    <year>2013</year>
                    <volume>10</volume>
                    <issue>2</issue>
                    <fpage>e1001382</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pmed.1001382" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1371/journal.pmed.1001382</pub-id>
                    <pub-id pub-id-type="medline">23424286</pub-id>
                    <pub-id pub-id-type="pii">PMEDICINE-D-12-02226</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3570540</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref12">
                <label>12</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Riedl</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Riedl</surname>
                            <given-names>E</given-names>
                        </name>
                    </person-group>
                    <article-title>Crowdsourcing medical research</article-title>
                    <source>Computer</source>
                    <year>2013</year>
                    <month>01</month>
                    <volume>46</volume>
                    <issue>1</issue>
                    <fpage>89</fpage>
                    <lpage>92</lpage>
                    <pub-id pub-id-type="doi">10.1109/MC.2013.15</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref13">
                <label>13</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Wicks</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Vaughan</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Heywood</surname>
                            <given-names>J</given-names>
                        </name>
                    </person-group>
                    <article-title>Subjects no more: what happens when trial participants realize they hold the power?</article-title>
                    <source>BMJ</source>
                    <year>2014</year>
                    <volume>348</volume>
                    <fpage>g368</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24472779" />
                    </comment>
                    <pub-id pub-id-type="medline">24472779</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3905107</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref14">
                <label>14</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Bian</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Topaloglu</surname>
                            <given-names>U</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Yu</surname>
                            <given-names>F</given-names>
                        </name>
                    </person-group>
                    <article-title>Towards large-scale Twitter mining for drug- related adverse events</article-title>
                    <source>Proceedings of the 2012 International Workshop on Smart Health and Wellbeing</source>
                    <year>2012</year>
                    <conf-name>International Workshop on Smart Health and Wellbeing</conf-name>
                    <conf-date>2012</conf-date>
                    <conf-loc>Maui, Hawaii, USA</conf-loc>
                    <fpage>25</fpage>
                    <lpage>32</lpage>
                </nlm-citation>
            </ref>
            <ref id="ref15">
                <label>15</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Mukherjee</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Weikum</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Danescu-Niculescu-Mizil</surname>
                            <given-names>C</given-names>
                        </name>
                    </person-group>
                    <article-title>People on drugs: credibility of user statements in health communities</article-title>
                    <source>Proceedings of the 20th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</source>
                    <year>2014</year>
                    <conf-name>20th ACM SIGKDD</conf-name>
                    <conf-date>2014</conf-date>
                    <conf-loc>New York, USA</conf-loc>
                    <fpage>65</fpage>
                    <lpage>74</lpage>
                </nlm-citation>
            </ref>
            <ref id="ref16">
                <label>16</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Bodnar</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Barclay</surname>
                            <given-names>VC</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ram</surname>
                            <given-names>N</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Tucker</surname>
                            <given-names>CS</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Salath&#180;e</surname>
                            <given-names>M</given-names>
                        </name>
                    </person-group>
                    <article-title>On the ground validation of online diagnosis with Twitter and medical records</article-title>
                    <source>Proceedings of the Companion Publication of the 23rd International Conference on World Wide Web Companion</source>
                    <year>2014</year>
                    <conf-name>23rd International Conference on World Wide Web</conf-name>
                    <conf-date>2014</conf-date>
                    <conf-loc>Seoul, Korea</conf-loc>
                    <fpage>651</fpage>
                    <lpage>656</lpage>
                </nlm-citation>
            </ref>
            <ref id="ref17">
                <label>17</label>
                <nlm-citation citation-type="web">
                    <source>Medical Expenditure Panel Survey</source>
                    <access-date>2015-05-13</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://meps.ahrq.gov/mepsweb/">http://meps.ahrq.gov/mepsweb/</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6YUMTLNXr</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref18">
                <label>18</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Hale</surname>
                            <given-names>Timothy M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Pathipati</surname>
                            <given-names>Akhilesh S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Zan</surname>
                            <given-names>Shiyi</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Jethwani</surname>
                            <given-names>Kamal</given-names>
                        </name>
                    </person-group>
                    <article-title>Representation of health conditions on Facebook: content analysis and evaluation of user engagement</article-title>
                    <source>J Med Internet Res</source>
                    <year>2014</year>
                    <volume>16</volume>
                    <issue>8</issue>
                    <fpage>e182</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2014/8/e182/" />
                    </comment>
                    <pub-id pub-id-type="doi">10.2196/jmir.3275</pub-id>
                    <pub-id pub-id-type="medline">25092386</pub-id>
                    <pub-id pub-id-type="pii">v16i8e182</pub-id>
                    <pub-id pub-id-type="pmcid">PMC4129190</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref19">
                <label>19</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Paul</surname>
                            <given-names>MJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Dredze</surname>
                            <given-names>M</given-names>
                        </name>
                    </person-group>
                    <article-title>Discovering health topics in social media using topic models</article-title>
                    <source>PLoS One</source>
                    <year>2014</year>
                    <volume>9</volume>
                    <issue>8</issue>
                    <fpage>e103408</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0103408" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1371/journal.pone.0103408</pub-id>
                    <pub-id pub-id-type="medline">25084530</pub-id>
                    <pub-id pub-id-type="pii">PONE-D-14-00554</pub-id>
                    <pub-id pub-id-type="pmcid">PMC4118877</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref20">
                <label>20</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Olejnik</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kutrowska</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Castelluccia</surname>
                            <given-names>C</given-names>
                        </name>
                    </person-group>
                    <article-title>I'M 2.8% Neanderthal - The beginning of genetic exhibitionism?</article-title>
                    <source>Workshop on Genome Privacy</source>
                    <year>2014</year>
                    <conf-name>Workshop on Genome Privacy</conf-name>
                    <conf-date>2014</conf-date>
                    <conf-loc>Amsterdam, Netherlands</conf-loc>
                </nlm-citation>
            </ref>
            <ref id="ref21">
                <label>21</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Hanson</surname>
                            <given-names>Carl L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Burton</surname>
                            <given-names>Scott H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Giraud-Carrier</surname>
                            <given-names>Christophe</given-names>
                        </name>
                        <name name-style="western">
                            <surname>West</surname>
                            <given-names>Josh H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Barnes</surname>
                            <given-names>Michael D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hansen</surname>
                            <given-names>Bret</given-names>
                        </name>
                    </person-group>
                    <article-title>Tweaking and tweeting: exploring Twitter for nonmedical use of a psychostimulant drug (Adderall) among college students</article-title>
                    <source>J Med Internet Res</source>
                    <year>2013</year>
                    <volume>15</volume>
                    <issue>4</issue>
                    <fpage>e62</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2013/4/e62/" />
                    </comment>
                    <pub-id pub-id-type="doi">10.2196/jmir.2503</pub-id>
                    <pub-id pub-id-type="medline">23594933</pub-id>
                    <pub-id pub-id-type="pii">v15i4e62</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3636321</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref22">
                <label>22</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Hanson</surname>
                            <given-names>Carl Lee</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Cannon</surname>
                            <given-names>Ben</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Burton</surname>
                            <given-names>Scott</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Giraud-Carrier</surname>
                            <given-names>Christophe</given-names>
                        </name>
                    </person-group>
                    <article-title>An exploration of social circles and prescription drug abuse through Twitter</article-title>
                    <source>J Med Internet Res</source>
                    <year>2013</year>
                    <volume>15</volume>
                    <issue>9</issue>
                    <fpage>e189</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2013/9/e189/" />
                    </comment>
                    <pub-id pub-id-type="doi">10.2196/jmir.2741</pub-id>
                    <pub-id pub-id-type="medline">24014109</pub-id>
                    <pub-id pub-id-type="pii">v15i9e189</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3785991</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref23">
                <label>23</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Wilson</surname>
                            <given-names>Kumanan</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Keelan</surname>
                            <given-names>Jennifer</given-names>
                        </name>
                    </person-group>
                    <article-title>Social media and the empowering of opponents of medical technologies: the case of anti-vaccinationism</article-title>
                    <source>J Med Internet Res</source>
                    <year>2013</year>
                    <volume>15</volume>
                    <issue>5</issue>
                    <fpage>e103</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2013/5/e103/" />
                    </comment>
                    <pub-id pub-id-type="doi">10.2196/jmir.2409</pub-id>
                    <pub-id pub-id-type="medline">23715762</pub-id>
                    <pub-id pub-id-type="pii">v15i5e103</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3668617</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref24">
                <label>24</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Duke</surname>
                            <given-names>Jennifer C</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hansen</surname>
                            <given-names>Heather</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kim</surname>
                            <given-names>Annice E</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Curry</surname>
                            <given-names>Laurel</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Allen</surname>
                            <given-names>Jane</given-names>
                        </name>
                    </person-group>
                    <article-title>The use of social media by state tobacco control programs to promote smoking cessation: a cross-sectional study</article-title>
                    <source>J Med Internet Res</source>
                    <year>2014</year>
                    <volume>16</volume>
                    <issue>7</issue>
                    <fpage>e169</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2014/7/e169/" />
                    </comment>
                    <pub-id pub-id-type="doi">10.2196/jmir.3430</pub-id>
                    <pub-id pub-id-type="medline">25014311</pub-id>
                    <pub-id pub-id-type="pii">v16i7e169</pub-id>
                    <pub-id pub-id-type="pmcid">PMC4115651</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref25">
                <label>25</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Cobb</surname>
                            <given-names>NK</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Jacobs</surname>
                            <given-names>MA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Saul</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Wileyto</surname>
                            <given-names>EP</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Graham</surname>
                            <given-names>AL</given-names>
                        </name>
                    </person-group>
                    <article-title>Diffusion of an evidence-based smoking cessation intervention through Facebook: a randomised controlled trial study protocol</article-title>
                    <source>BMJ Open</source>
                    <year>2014</year>
                    <volume>4</volume>
                    <issue>1</issue>
                    <fpage>e004089</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://bmjopen.bmj.com/cgi/pmidlookup?view=long&#38;pmid=24448847" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1136/bmjopen-2013-004089</pub-id>
                    <pub-id pub-id-type="medline">24448847</pub-id>
                    <pub-id pub-id-type="pii">bmjopen-2013-004089</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3902462</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref26">
                <label>26</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Jaganath</surname>
                            <given-names>Devan</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Gill</surname>
                            <given-names>Harkiran K</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Cohen</surname>
                            <given-names>Adam Carl</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Young</surname>
                            <given-names>Sean D</given-names>
                        </name>
                    </person-group>
                    <article-title>Harnessing Online Peer Education (HOPE): integrating C-POL and social media to train peer leaders in HIV prevention</article-title>
                    <source>AIDS Care</source>
                    <year>2012</year>
                    <volume>24</volume>
                    <issue>5</issue>
                    <fpage>593</fpage>
                    <lpage>600</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/22149081" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1080/09540121.2011.630355</pub-id>
                    <pub-id pub-id-type="medline">22149081</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3342451</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref27">
                <label>27</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Aramaki</surname>
                            <given-names>E</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Maskawa</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Morita</surname>
                            <given-names>M</given-names>
                        </name>
                    </person-group>
                    <article-title>Twitter catches the flu: detecting influenza epidemics using Twitter</article-title>
                    <source>Proceedings of the Conference on Empirical Methods in Natural Language Processing</source>
                    <year>2011</year>
                    <conf-name>Conference on Empirical Methods in Natural Language Processing</conf-name>
                    <conf-date>2011</conf-date>
                    <conf-loc>Edinburgh, United Kingdom</conf-loc>
                    <fpage>1568</fpage>
                    <lpage>1576</lpage>
                </nlm-citation>
            </ref>
            <ref id="ref28">
                <label>28</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Nagar</surname>
                            <given-names>Ruchit</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Yuan</surname>
                            <given-names>Qingyu</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Freifeld</surname>
                            <given-names>Clark C</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Santillana</surname>
                            <given-names>Mauricio</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Nojima</surname>
                            <given-names>Aaron</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Chunara</surname>
                            <given-names>Rumi</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Brownstein</surname>
                            <given-names>John S</given-names>
                        </name>
                    </person-group>
                    <article-title>A case study of the New York City 2012-2013 influenza season with daily geocoded Twitter data from temporal and spatiotemporal perspectives</article-title>
                    <source>J Med Internet Res</source>
                    <year>2014</year>
                    <volume>16</volume>
                    <issue>10</issue>
                    <fpage>e236</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2014/10/e236/" />
                    </comment>
                    <pub-id pub-id-type="doi">10.2196/jmir.3416</pub-id>
                    <pub-id pub-id-type="medline">25331122</pub-id>
                    <pub-id pub-id-type="pii">v16i10e236</pub-id>
                    <pub-id pub-id-type="pmcid">PMC4259880</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref29">
                <label>29</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Nagel</surname>
                            <given-names>Anna C</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Tsou</surname>
                            <given-names>Ming-Hsiang</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Spitzberg</surname>
                            <given-names>Brian H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>An</surname>
                            <given-names>Li</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Gawron</surname>
                            <given-names>J Mark</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Gupta</surname>
                            <given-names>Dipak K</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Yang</surname>
                            <given-names>Jiue-An</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Han</surname>
                            <given-names>Su</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Peddecord</surname>
                            <given-names>K Michael</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lindsay</surname>
                            <given-names>Suzanne</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sawyer</surname>
                            <given-names>Mark H</given-names>
                        </name>
                    </person-group>
                    <article-title>The complex relationship of realspace events and messages in cyberspace: case study of influenza and pertussis using tweets</article-title>
                    <source>J Med Internet Res</source>
                    <year>2013</year>
                    <volume>15</volume>
                    <issue>10</issue>
                    <fpage>e237</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2013/10/e237/" />
                    </comment>
                    <pub-id pub-id-type="doi">10.2196/jmir.2705</pub-id>
                    <pub-id pub-id-type="medline">24158773</pub-id>
                    <pub-id pub-id-type="pii">v15i10e237</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3841359</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref30">
                <label>30</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Curtis</surname>
                            <given-names>Brenda L</given-names>
                        </name>
                    </person-group>
                    <article-title>Social networking and online recruiting for HIV research: ethical challenges</article-title>
                    <source>J Empir Res Hum Res Ethics</source>
                    <year>2014</year>
                    <month>02</month>
                    <volume>9</volume>
                    <issue>1</issue>
                    <fpage>58</fpage>
                    <lpage>70</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24572084" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1525/jer.2014.9.1.58</pub-id>
                    <pub-id pub-id-type="medline">24572084</pub-id>
                    <pub-id pub-id-type="pmcid">PMC4316828</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref31">
                <label>31</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Lazer</surname>
                            <given-names>DM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kennedy</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>King</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Vespignani</surname>
                            <given-names>A</given-names>
                        </name>
                    </person-group>
                    <article-title>Big data. The parable of Google Flu: traps in big data analysis</article-title>
                    <source>Science</source>
                    <year>2014</year>
                    <month>03</month>
                    <day>14</day>
                    <volume>343</volume>
                    <issue>6176</issue>
                    <fpage>1203</fpage>
                    <lpage>5</lpage>
                    <pub-id pub-id-type="doi">10.1126/science.1248506</pub-id>
                    <pub-id pub-id-type="medline">24626916</pub-id>
                    <pub-id pub-id-type="pii">343/6176/1203</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref32">
                <label>32</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Mao</surname>
                            <given-names>H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Shuai</surname>
                            <given-names>X</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kapadia</surname>
                            <given-names>A</given-names>
                        </name>
                    </person-group>
                    <article-title>Loose tweets: an analysis of privacy leaks on Twitter</article-title>
                    <source>Proceedings of the 10th Annual ACM Workshop on Privacy in the Electronic Society</source>
                    <year>2011</year>
                    <conf-name>ACM Workshop on Privacy in the Electronic Society</conf-name>
                    <conf-date>2011</conf-date>
                    <conf-loc>Chicago, Illinois</conf-loc>
                    <fpage>1</fpage>
                    <lpage>12</lpage>
                </nlm-citation>
            </ref>
            <ref id="ref33">
                <label>33</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Lamb</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Paul</surname>
                            <given-names>MJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Dredze</surname>
                            <given-names>M</given-names>
                        </name>
                    </person-group>
                    <article-title>Separating fact from fear: tracking flu infections on Twitter</article-title>
                    <source>Proceedings of HLT-NAACL</source>
                    <year>2013</year>
                    <conf-name>Human Language Technologies: Conference of the North American Chapter of the Association of Computational Linguistics</conf-name>
                    <conf-date>2013</conf-date>
                    <conf-loc>Atlanta, Georgia</conf-loc>
                    <fpage>789</fpage>
                    <lpage>795</lpage>
                </nlm-citation>
            </ref>
            <ref id="ref34">
                <label>34</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Gattani</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Doan</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lamba</surname>
                            <given-names>Ds</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Garera</surname>
                            <given-names>N</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Tiwari</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Chai</surname>
                            <given-names>X</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Das</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Subramaniam</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Rajaraman</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Harinarayan</surname>
                            <given-names>V</given-names>
                        </name>
                    </person-group>
                    <article-title>Entity extraction, linking, classification, and tagging for social media</article-title>
                    <source>Proc VLDB Endow</source>
                    <year>2013</year>
                    <month>08</month>
                    <day>27</day>
                    <volume>6</volume>
                    <issue>11</issue>
                    <fpage>1126</fpage>
                    <lpage>1137</lpage>
                    <pub-id pub-id-type="doi">10.14778/2536222.2536237</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref35">
                <label>35</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Yang</surname>
                            <given-names>SH</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kolcz</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Schlaikjer</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Gupta</surname>
                            <given-names>P</given-names>
                        </name>
                    </person-group>
                    <article-title>Large-scale high-precision topic modeling on Twitter</article-title>
                    <source>Proceedings of the 20th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</source>
                    <year>2014</year>
                    <conf-name>ACM SIGKDD</conf-name>
                    <conf-date>2014</conf-date>
                    <conf-loc>New York, USA</conf-loc>
                    <fpage>1907</fpage>
                    <lpage>1916</lpage>
                </nlm-citation>
            </ref>
            <ref id="ref36">
                <label>36</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Banerjee</surname>
                            <given-names>N</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Chakraborty</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Dasgupta</surname>
                            <given-names>K</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Mittal</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Joshi</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Nagar</surname>
                            <given-names>S</given-names>
                        </name>
                    </person-group>
                    <article-title>User interests in social media sites: an exploration with micro- blogs</article-title>
                    <source>Proceedings of the 18th ACM Conference on Information and Knowledge Management</source>
                    <year>2009</year>
                    <conf-name>ACM Conference on Information and Knowledge Management</conf-name>
                    <conf-date>2009</conf-date>
                    <conf-loc>Hong Kong, China</conf-loc>
                    <fpage>1823</fpage>
                    <lpage>1826</lpage>
                </nlm-citation>
            </ref>
            <ref id="ref37">
                <label>37</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Davidov</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Tsur</surname>
                            <given-names>O</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Rappoport</surname>
                            <given-names>A</given-names>
                        </name>
                    </person-group>
                    <article-title>Semi-supervised recognition of sarcastic sentences in Twitter and Amazon</article-title>
                    <source>Proceedings of the Fourteenth Conference on Computational Natural Language Learning</source>
                    <year>2010</year>
                    <conf-name>Conference on Computational Natural Language Learning</conf-name>
                    <conf-date>2010</conf-date>
                    <conf-loc>Uppsala, Sweden</conf-loc>
                    <fpage>107</fpage>
                    <lpage>116</lpage>
                </nlm-citation>
            </ref>
            <ref id="ref38">
                <label>38</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Sriram</surname>
                            <given-names>B</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Fuhry</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Demir</surname>
                            <given-names>E</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ferhatosmanoglu</surname>
                            <given-names>H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Demirbas</surname>
                            <given-names>M</given-names>
                        </name>
                    </person-group>
                    <article-title>Short text classification in Twitter to improve information filtering</article-title>
                    <source>Proceedings of the 33rd International ACM SIGIR Conference on Research and Development in Information Retrieval</source>
                    <year>2010</year>
                    <conf-name>ACM SIGIR</conf-name>
                    <conf-date>2010</conf-date>
                    <conf-loc>Geneva, Switzerland</conf-loc>
                    <fpage>841</fpage>
                    <lpage>842</lpage>
                </nlm-citation>
            </ref>
            <ref id="ref39">
                <label>39</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Banerjee</surname>
                            <given-names>N</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Chakraborty</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Joshi</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Mittal</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Rai</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ravindran</surname>
                            <given-names>B</given-names>
                        </name>
                    </person-group>
                    <article-title>Towards analyzing micro-blogs for detection and classification of real-time intentions</article-title>
                    <source>Proceedings of the 6th International AAAI Conference on Weblogs and Social Media</source>
                    <year>2012</year>
                    <conf-name>International AAAI Conference on Weblogs and Social Media</conf-name>
                    <conf-date>2012</conf-date>
                    <conf-loc>Dublin, Ireland</conf-loc>
                </nlm-citation>
            </ref>
            <ref id="ref40">
                <label>40</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Davis</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Goadrich</surname>
                            <given-names>M</given-names>
                        </name>
                    </person-group>
                    <article-title>The relationship between Precision-Recall and ROC curves</article-title>
                    <source>Proceedings of the 23rd International Conference on Machine Learning</source>
                    <year>2006</year>
                    <conf-name>International Conference on Machine Learning</conf-name>
                    <conf-date>2006</conf-date>
                    <conf-loc>Pittsburgh, Pennsylvania</conf-loc>
                    <fpage>233</fpage>
                    <lpage>240</lpage>
                </nlm-citation>
            </ref>
            <ref id="ref41">
                <label>41</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Cer</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>de Marneffe</surname>
                            <given-names>MC</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Jurafsky</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Manning</surname>
                            <given-names>CD</given-names>
                        </name>
                    </person-group>
                    <article-title>Parsing to Stanford dependencies: trade-offs between speed and accuracy</article-title>
                    <source>Proceedings of the International Conference on Language Resources and Evaluation</source>
                    <year>2010</year>
                    <conf-name>International Conference on Language Resources and Evaluation</conf-name>
                    <conf-date>2010</conf-date>
                    <conf-loc>Valletta, Malta</conf-loc>
                </nlm-citation>
            </ref>
            <ref id="ref42">
                <label>42</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Vydiswaran</surname>
                            <given-names>V</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Mei</surname>
                            <given-names>Q</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hanauer</surname>
                            <given-names>DA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Zheng</surname>
                            <given-names>K</given-names>
                        </name>
                    </person-group>
                    <article-title>Mining consumer health vocabulary from community-generated text</article-title>
                    <source>Proceedings of the American Medical Informatics Association Annual Symposium (AMIA)</source>
                    <year>2014</year>
                    <conf-name>AMIA</conf-name>
                    <conf-date>2014</conf-date>
                    <conf-loc>Washington, DC</conf-loc>
                </nlm-citation>
            </ref>
        </ref-list>
    </back>
</article>
