<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
    <front>
        <journal-meta>
            <journal-id journal-id-type="publisher-id">JMIR</journal-id>
            <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
            <journal-title>Journal of Medical Internet Research</journal-title>
            <issn pub-type="epub">1438-8871</issn>
            <publisher>
                <publisher-name>JMIR Publications Inc.</publisher-name>
                <publisher-loc>Toronto, Canada</publisher-loc>
            </publisher>
        </journal-meta>
        <article-meta>
            <article-id pub-id-type="publisher-id">v17i8e194</article-id>
            <article-id pub-id-type="pmid">26250986</article-id>
            <article-id pub-id-type="doi">10.2196/jmir.4308</article-id>
            <article-categories>
                <subj-group subj-group-type="heading">
                    <subject>Original Paper</subject>
                </subj-group>
                <subj-group subj-group-type="article-type">
                    <subject>Original Paper</subject>
                </subj-group>
            </article-categories>
            <title-group>
                <article-title>A Study of the Demographics of Web-Based Health-Related Social Media Users</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="editor">
                    <name>
                        <surname>Eysenbach</surname>
                        <given-names>Gunther</given-names>
                    </name>
                </contrib>
            </contrib-group>
            <contrib-group>
                <contrib contrib-type="reviewer">
                    <name>
                        <surname>Luo</surname>
                        <given-names>Gang</given-names>
                    </name>
                </contrib>
                <contrib contrib-type="reviewer">
                    <name>
                        <surname>Tremblay</surname>
                        <given-names>Monica</given-names>
                    </name>
                </contrib>
            </contrib-group>
            <contrib-group>
                <contrib contrib-type="author" id="contrib1" corresp="yes">
                    <name name-style="western">
                        <surname>Sadah</surname>
                        <given-names>Shouq A</given-names>
                    </name>
                    <degrees>MS</degrees>
                    <xref rid="aff1" ref-type="aff">1</xref>
                    <address>
                        <institution>Department of Computer Science and Engineering</institution>
                        <institution>University of California, Riverside</institution>
                        <addr-line>351 Winston Chung Hall</addr-line>
                        <addr-line>900 University Ave</addr-line>
                        <addr-line>Riverside, CA, 92521</addr-line>
                        <country>United States</country>
                        <phone>1 9517565691</phone>
                        <fax>1 9518274643</fax>
                        <email>ssada003@cs.ucr.edu</email>
                    </address>
                    <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-5203-4355</ext-link>
                </contrib>
                <contrib contrib-type="author" id="contrib2">
                    <name name-style="western">
                        <surname>Shahbazi</surname>
                        <given-names>Moloud</given-names>
                    </name>
                    <degrees>MS</degrees>
                    <xref rid="aff1" ref-type="aff">1</xref>
                    <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-8031-0169</ext-link>
                </contrib>
                <contrib contrib-type="author" id="contrib3">
                    <name name-style="western">
                        <surname>Wiley</surname>
                        <given-names>Matthew T</given-names>
                    </name>
                    <degrees>MS</degrees>
                    <xref rid="aff1" ref-type="aff">1</xref>
                    <xref rid="aff2" ref-type="aff">2</xref>
                    <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-9441-3786</ext-link>
                </contrib>
                <contrib contrib-type="author" id="contrib4">
                    <name name-style="western">
                        <surname>Hristidis</surname>
                        <given-names>Vagelis</given-names>
                    </name>
                    <degrees>PhD</degrees>
                    <xref rid="aff1" ref-type="aff">1</xref>
                    <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-8679-4988</ext-link>
                </contrib>
            </contrib-group>
            <aff id="aff1">
                <sup>1</sup>
                <institution>Department of Computer Science and Engineering</institution>
                <institution>University of California, Riverside</institution>
                <addr-line>Riverside, CA</addr-line>
                <country>United States</country>
            </aff>
            <aff id="aff2">
                <sup>2</sup>
                <institution>SmartDocFinder LLC</institution>
                <addr-line>Riverside, CA</addr-line>
                <country>United States</country>
            </aff>
            <author-notes>
                <corresp>Corresponding Author: Shouq A Sadah <email>ssada003@cs.ucr.edu</email>
                </corresp>
            </author-notes>
            <pub-date pub-type="collection">
                <month>08</month>
                <year>2015</year>
            </pub-date>
            <pub-date pub-type="epub">
                <day>06</day>
                <month>08</month>
                <year>2015</year>
            </pub-date>
            <volume>17</volume>
            <issue>8</issue>
            <elocation-id>e194</elocation-id>
            <!--history from ojs - api-xml-->
            <history>
                <date date-type="received">
                    <day>2</day>
                    <month>2</month>
                    <year>2015</year>
                </date>
                <date date-type="rev-request">
                    <day>12</day>
                    <month>3</month>
                    <year>2015</year>
                </date>
                <date date-type="rev-recd">
                    <day>15</day>
                    <month>6</month>
                    <year>2015</year>
                </date>
                <date date-type="accepted">
                    <day>3</day>
                    <month>7</month>
                    <year>2015</year>
                </date>
            </history>
            <!--(c) the authors - correct author names and publication date here if necessary. Date in form ', dd.mm.yyyy' after jmir.org-->
            <copyright-statement>&#169;Shouq A Sadah, Moloud Shahbazi, Matthew T Wiley, Vagelis Hristidis. Originally published in the Journal of Medical Internet Research (http://www.jmir.org), 06.08.2015. </copyright-statement>
            <copyright-year>2015</copyright-year>
            <license license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/2.0/">
                <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (http://creativecommons.org/licenses/by/2.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on http://www.jmir.org/, as well as this copyright and license information must be included.</p>
            </license>
            <self-uri xlink:href="http://www.jmir.org/2015/8/e194/" xlink:type="simple" />
            <abstract>
                <sec sec-type="background">
                    <title>Background</title>
                    <p>The rapid spread of Web-based social media in recent years has impacted how patients share health-related information. However, little work has studied the demographics of these users.</p>
                </sec>
                <sec sec-type="objective">
                    <title>Objective</title>
                    <p>Our aim was to study the demographics of users who participate in health-related Web-based social outlets to identify possible links to health care disparities.</p>
                </sec>
                <sec sec-type="methods">
                    <title>Methods</title>
                    <p>We analyze and compare three different types of health-related social outlets: (1) general Web-based social networks, Twitter and Google+, (2) drug review websites, and (3) health Web forums. We focus on the following demographic attributes: age, gender, ethnicity, location, and writing level. We build and evaluate domain-specific classifiers to infer missing data where possible. The estimated demographic statistics are compared against various baselines, such as Internet and social networks usage of the population.</p>
                </sec>
                <sec sec-type="results">
                    <title>Results</title>
                    <p>We found that (1) drug review websites and health Web forums are dominated by female users, (2) the participants of health-related social outlets are generally older with the exception of the 65+ years bracket, (3) blacks are underrepresented in health-related social networks, (4) users in areas with better access to health care participate more in Web-based health-related social outlets, and (5) the writing level of users in health-related social outlets is significantly lower than the reading level of the population.</p>
                </sec>
                <sec sec-type="conclusions">
                    <title>Conclusions</title>
                    <p>We identified interesting and actionable disparities in the participation of various demographic groups in various types of health-related social outlets. These disparities are significantly distinct from the disparities in Internet usage or general social outlets participation.</p>
                </sec>
            </abstract>
            <kwd-group>
                <kwd>online social media</kwd>
                <kwd>demographics</kwd>
                <kwd>health forums</kwd>
                <kwd>health care disparity</kwd>
                <kwd>drug reviews</kwd>
            </kwd-group>
        </article-meta>
    </front>
    <body>
        <sec sec-type="introduction">
            <title>Introduction</title>
            <sec>
                <title>Background</title>
                <p>Social media have been employed in many industries to engage consumers. The health care industry has moved at a slower pace in incorporating social media because of inherent risks such as patient privacy, but recently this rate has increased to fulfill the consumers&#8217; needs [<xref ref-type="bibr" rid="ref1">1</xref>]. Moreover, some companies use social media to provide their employees with wellness videos in order to cut their health care costs [<xref ref-type="bibr" rid="ref2">2</xref>].</p>
                <p>At the same time, health care disparity is a well-studied problem in which two population groups receive unequal services [<xref ref-type="bibr" rid="ref3">3</xref>]. This problem has been analyzed across various dimensions relating to social determinants in health, including education and income, environmental hazards, and health outcomes such as mortality, morbidity, and behavioral risk factors [<xref ref-type="bibr" rid="ref4">4</xref>]. However, health care disparity has not been studied in terms of social media participation. This is important as Internet access and participation in health communities has the potential to improve health outcomes [<xref ref-type="bibr" rid="ref5">5</xref>]. Hence, understanding the demographics of social outlets, which is the focus of this paper, may shed light on another facet of health care disparity.</p>
                <p>To cover different types of Web-based social outlets, we collected data from three types of sources: (1) general Web-based social networks, namely Google+ and Twitter, (2) drug review websites, and (3) health Web forums. We measure the following demographic attributes: age, gender, ethnicity, location, and writing level. Unfortunately, much of this information is unavailable for some, or all, of the sources. Therefore, we built and evaluated three classifiers for gender, ethnicity, and writing level. User names were used for the gender and ethnicity classifiers. Writing level for users was calculated using a modified reading level formula to ignore very long incomprehensible sentences. To extract the location of a post, we use a geocoding application programming interface (API).</p>
            </sec>
            <sec>
                <title>Related Work</title>
                <sec>
                    <title>Analysis of Health-Related Social Outlets</title>
                    <p>Many researchers have explored the effectiveness of Web-based social media in changing and improving the communication between providers and patients. According to Kane et al [<xref ref-type="bibr" rid="ref6">6</xref>], 60 million Americans are using Health 2.0 applications, that is, social networks focused specifically on health care. Further, approximately 40% of Americans find an opinion in social media is more trustworthy if it conflicts with a professional&#8217;s opinion or diagnosis. Hackworth and Kunz [<xref ref-type="bibr" rid="ref7">7</xref>] found that 80% of American adults have looked online for health-related topics. Recently, there is increased interest in analyzing the health-related content of social media [<xref ref-type="bibr" rid="ref1">1</xref>]. Denecke and Nejdl [<xref ref-type="bibr" rid="ref8">8</xref>] analyzed medical concepts mentioned in medical social media posts from different sources to differentiate between informative and affective posts. They found that patients and nurses tend to share personal experiences, while physicians share health-related information. Lu et al [<xref ref-type="bibr" rid="ref9">9</xref>] studied the content of three disease-specific health communities and their relationship to five informative topics: symptoms, complications, examination, drugs, and procedures. For example, users with breast cancer are more likely to discuss examination, while users with lung cancer are more likely to discuss symptoms. Wiley et al [<xref ref-type="bibr" rid="ref10">10</xref>] analyzed the content of Web-based social media related to pharmaceutical drugs across several dimensions, including frequently mentioned diseases, keywords, and sentiment. While the aforementioned work examined health-related social media and content, none of them studied the demographics of the participating users, which is studied in this work.</p>
                </sec>
                <sec>
                    <title>Measuring and Estimating Demographics of Users of Social Outlets</title>
                    <sec>
                        <title>Survey-Based Methods</title>
                        <p>In 2012, a Pew Internet Research study showed that women, age 30-49, are more likely to participate in social media websites, where 75% of users are white [<xref ref-type="bibr" rid="ref11">11</xref>]. eMarketer found that 68.9% of Hispanics use social media compared to 66.2% of the total population. Further, they showed that Hispanics are more likely to compare products online while shopping and write reviews on products [<xref ref-type="bibr" rid="ref12">12</xref>]. However, no research has focused on health-related social media.</p>
                    </sec>
                    <sec>
                        <title>Classifier-Based Methods</title>
                        <p>Mislove et al [<xref ref-type="bibr" rid="ref13">13</xref>] built methods to estimate both gender and ethnicity for Twitter users using the 1000 most popular first names reported by the US Social Security Administration and frequently occurring surnames reported by the 2000 US census. Gender and ethnicity methods used the reported first name and last name respectively. Mandel et al [<xref ref-type="bibr" rid="ref14">14</xref>] analyzed the tweets related to Hurricane Irene using Mislove&#8217;s gender classifier. We build on Mislove&#8217;s work when creating our classifiers. While we also classify gender using first names, we extended these methods to screen names when a first name is not present. A related work for estimating reading levels of the US population [<xref ref-type="bibr" rid="ref15">15</xref>] was presented to discuss limitations of low literacy patients. We measured the writing level based on this work since we did not encounter any similar work.</p>
                    </sec>
                </sec>
            </sec>
        </sec>
        <sec sec-type="methods">
            <title>Methods</title>
            <sec>
                <title>Datasets</title>
                <p>Our analysis used data collected from three different types of health-related social outlets: general social networks, drug review websites, and health Web forums (<xref ref-type="table" rid="table1">Table 1</xref> [<xref ref-type="bibr" rid="ref16">16</xref>-<xref ref-type="bibr" rid="ref23">23</xref>]). Google+ and Twitter were chosen as general social networks based on their popularity and number of users (we do not study Facebook because it offers no public interfaces to access its data). For drug review websites and health Web forums, three websites were selected for each, where we considered their breadth of topics and popularity. <xref ref-type="fig" rid="figure1">Figure 1</xref> shows the overall process of our analysis, and <xref ref-type="table" rid="table1">Table 1</xref> shows key statistics of each source including number of users, number of posts, and average sentence length. More information about the sources including start and end date is available in <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>.</p>
                <table-wrap position="float" id="table1">
                    <label>Table 1</label>
                    <caption>
                        <p>Total number of users, posts, and average sentence length for each source.</p>
                    </caption>
                    <table width="638" border="0" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                        <col width="191" />
                        <col width="121" />
                        <col width="121" />
                        <col width="149" />
                        <thead>
                            <tr valign="top">
                                <td>Dataset</td>
                                <td>Users, n</td>
                                <td>Posts, n</td>
                                <td>Average sentence length (in words)</td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td>TwitterHealth [<xref ref-type="bibr" rid="ref16">16</xref>]</td>
                                <td>5,095,849</td>
                                <td>11,637,888</td>
                                <td>10.82</td>
                            </tr>
                            <tr valign="top">
                                <td>Google+Health [<xref ref-type="bibr" rid="ref17">17</xref>]</td>
                                <td>86,749</td>
                                <td>186,666</td>
                                <td>9.03</td>
                            </tr>
                            <tr valign="top">
                                <td>Drugs.com [<xref ref-type="bibr" rid="ref18">18</xref>]</td>
                                <td>74,461</td>
                                <td>74,461</td>
                                <td>13.85</td>
                            </tr>
                            <tr valign="top">
                                <td>DailyStrength/Treatments [<xref ref-type="bibr" rid="ref19">19</xref>]</td>
                                <td>213,524</td>
                                <td>1,055,603</td>
                                <td>11.92</td>
                            </tr>
                            <tr valign="top">
                                <td>WebMD/Drugs [<xref ref-type="bibr" rid="ref20">20</xref>]</td>
                                <td>122,040</td>
                                <td>122,040</td>
                                <td>13.53</td>
                            </tr>
                            <tr valign="top">
                                <td>Drugs.com/Answers [<xref ref-type="bibr" rid="ref21">21</xref>]</td>
                                <td>201,126</td>
                                <td>5,948,877</td>
                                <td>6.59</td>
                            </tr>
                            <tr valign="top">
                                <td>DailyStrength/Forums [<xref ref-type="bibr" rid="ref22">22</xref>]</td>
                                <td>165,045</td>
                                <td>1,128,629</td>
                                <td>13.2</td>
                            </tr>
                            <tr valign="top">
                                <td>WebMD [<xref ref-type="bibr" rid="ref23">23</xref>]</td>
                                <td>155,912</td>
                                <td>320,118</td>
                                <td>15.37</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
                <p>
                    <xref ref-type="table" rid="table2">Table 2</xref> shows which of the sources provide data for each of the five demographic attributes. Two demographic attributes are not present in any source: ethnicity and writing level. We therefore created methods to automatically classify these attributes, along with gender for the sources where unavailable. <italic>No</italic> indicates that the demographic attribute is not provided by the source. <italic>Yes</italic> indicates that the demographic attribute is provided by the source. Each classifier uses a distinct part of the user profile as denoted by the table footnotes. The writing level classifier uses the Flesch-Kincaid measure based on all users&#8217; posts [<xref ref-type="bibr" rid="ref24">24</xref>].</p>
                <table-wrap position="float" id="table2">
                    <label>Table 2</label>
                    <caption>
                        <p>List of all used sources with the available attributes.</p>
                    </caption>
                    <table width="671" border="0" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                        <col width="157" />
                        <col width="28" />
                        <col width="102" />
                        <col width="112" />
                        <col width="55" />
                        <col width="133" />
                        <thead>
                            <tr valign="top">
                                <td>Dataset</td>
                                <td>Age</td>
                                <td>Gender</td>
                                <td>Ethnicity</td>
                                <td>Location</td>
                                <td>Writing level</td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td>TwitterHealth</td>
                                <td>No</td>
                                <td>Gender classifier<sup>a</sup>
                                </td>
                                <td rowspan="2">Ethnicity classifier<sup>b</sup>
                                </td>
                                <td>Yes</td>
                                <td>Writing level classifier</td>
                            </tr>
                            <tr valign="top">
                                <td>Google+Health</td>
                                <td>Yes</td>
                                <td>Yes</td>
                                <td>Yes</td>
                                <td>Writing level classifier</td>
                            </tr>
                            <tr valign="bottom">
                                <td>Drugs.com</td>
                                <td>No</td>
                                <td>Gender classifier<sup>c</sup>
                                </td>
                                <td>No</td>
                                <td>No</td>
                                <td>Writing level classifier</td>
                            </tr>
                            <tr valign="top">
                                <td>DailyStrength/Treatments</td>
                                <td>Yes</td>
                                <td>Yes</td>
                                <td>No</td>
                                <td>Yes</td>
                                <td>Writing level classifier</td>
                            </tr>
                            <tr valign="top">
                                <td>WebMD/Drugs</td>
                                <td>Yes</td>
                                <td>Yes</td>
                                <td>No</td>
                                <td>No</td>
                                <td>Writing level classifier</td>
                            </tr>
                            <tr valign="bottom">
                                <td>Drugs.com/Answers</td>
                                <td>No</td>
                                <td>Gender classifier<sup>c</sup>
                                </td>
                                <td>No</td>
                                <td>No</td>
                                <td>Writing level classifier</td>
                            </tr>
                            <tr valign="top">
                                <td>DailyStrength/Forums</td>
                                <td>Yes</td>
                                <td>Yes</td>
                                <td>No</td>
                                <td>Yes</td>
                                <td>Writing level classifier</td>
                            </tr>
                            <tr valign="bottom">
                                <td>WebMD</td>
                                <td>No</td>
                                <td>Gender classifier<sup>c</sup>
                                </td>
                                <td>No</td>
                                <td>No</td>
                                <td>Writing level classifier</td>
                            </tr>
                        </tbody>
                    </table>
                    <table-wrap-foot>
                        <fn id="table2fn1">
                            <p>
                                <sup>a</sup>First name.</p>
                        </fn>
                        <fn id="table2fn2">
                            <p>
                                <sup>b</sup>Last name.</p>
                        </fn>
                        <fn id="table2fn3">
                            <p>
                                <sup>c</sup>Screen name.</p>
                        </fn>
                    </table-wrap-foot>
                </table-wrap>
                <p>To filter health-related posts from Twitter and Google+, we built a list of 276 representative health-related keywords based on five categories:</p>
                <list list-type="order">
                    <list-item>
                        <p>Drugs: First we obtained a list of the 200 most popular drugs by prescriptions dispensed from RxList.com [<xref ref-type="bibr" rid="ref25">25</xref>]. We then removed variants of the same drug (eg, different milligram dosages) resulting in 125 unique drug names.</p>
                    </list-item>
                    <list-item>
                        <p>Hashtags: We selected 11 popular health-related Twitter hashtags such as #HCSM (Healthcare Communications &#38; Social Media).</p>
                    </list-item>
                    <list-item>
                        <p>Disorders: We selected 81 popular disorders such as cancer and Alzheimer.</p>
                    </list-item>
                    <list-item>
                        <p>Pharmaceuticals: We selected the 12 largest pharmaceutical companies such as Pfizer.</p>
                    </list-item>
                    <list-item>
                        <p>Insurance: We selected 44 of the biggest insurances such as Medicare and Humana. A complete list of used keywords can be found in <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>.</p>
                    </list-item>
                </list>
                <p>We used the Twitter streaming API [<xref ref-type="bibr" rid="ref26">26</xref>], with these keywords as filters, to obtain the relevant tweets for our TwitterHealth dataset. Our Google+Health dataset was collected via the Google+ API [<xref ref-type="bibr" rid="ref27">27</xref>], where each health-related keyword was used as a query to find relevant posts. For the drug review websites and health Web forums, we built custom crawlers in Java using the jsoup [<xref ref-type="bibr" rid="ref28">28</xref>] library for crawling and parsing the hypertext markup language (HTML) content. For each source, we collected the available data, including user information, posts, disorder, or condition under which a discussion appears, keywords, tags, etc. We emphasize that we collected only publicly available data in accordance with each site&#8217;s terms of use; no private data were collected.</p>
                <fig id="figure1" position="float">
                    <label>Figure 1</label>
                    <caption>
                        <p>Overview of the data collection and analysis process.</p>
                    </caption>
                    <graphic xlink:href="jmir_v17i8e194_fig1.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
            </sec>
            <sec>
                <title>User Demographics Estimation Methods</title>
                <sec>
                    <title>Overview</title>
                    <p>We chose five demographic attributes as shown in <xref ref-type="table" rid="table2">Table 2</xref>: gender, age, ethnicity, location, and writing level. Since these attributes are not available in every source, we created several classifiers to derive missing attributes as specified in <xref ref-type="table" rid="table2">Table 2</xref>. Note that we do not fill missing values of users for sources that provide this information for at least some of their users; for example, if a user does not provide their age in Google+, we simply exclude this user from the age-related analysis. <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref> shows the percentages of users who report each attribute in each source.</p>
                </sec>
                <sec>
                    <title>Gender</title>
                    <p>Four out of eight sources (Google+Health, DailyStrength/Treatments, WebMD/Drugs, and DailyStrength/Forums) allow users to report their gender (as shown in <xref ref-type="table" rid="table2">Table 2</xref>). Approximately 80% of the users of these sources chose to report it; thus, the reported gender was used for these sources.</p>
                    <p>For the other sources where gender is not available, we extended the methods of Mislove et al [<xref ref-type="bibr" rid="ref13">13</xref>] to classify gender using the reported first name of users, if available; otherwise we extracted first names from user screen names. Note that screen names have not been used before, to the best of our knowledge, for gender estimation. In particular, we first collected the 1000 most popular male and female birth names reported by the US Social Security Administration [<xref ref-type="bibr" rid="ref29">29</xref>] for each year from 1935 to 1995. Thus, we collected the names of people in 2014 aged 19-79 years old, which constitutes about 73.9% of the population [<xref ref-type="bibr" rid="ref30">30</xref>]. There are 55,973 unique names in total. We further filtered this list to remove names with an aggregated frequency less than 10,000 or a discriminative gender probability less than 95%. The resultant list contained 1328 names. For TwitterHealth and Google+Health, we checked if one of these 1328 first names is contained in the user-specified name to classify the user&#8217;s gender. We first cleaned the first name by removing non-alphabetical characters and then performed case-insensitive string matching. Gender classifier evaluation is reported in <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>; the accuracy ranges from 76% to 99%.</p>
                </sec>
                <sec>
                    <title>Age</title>
                    <p>Similarly, age was also reported in four sources (Google+Health, DailyStrength/Treatments, WebMD/Drugs, and DailyStrength/Forums). Three sources display the age as a single number, whereas one source displays age as a range (eg, 35-45). Approximately 61% of the users of these sources reported their age. When users provide an age range, the total number of users for each range is distributed uniformly to each year in the range. Ages are then grouped into five age groups: 0-17, 18-34, 35-44, 45-64, and 65 years and older. These age ranges are also used by the US census [<xref ref-type="bibr" rid="ref31">31</xref>].</p>
                </sec>
                <sec>
                    <title>Ethnicity</title>
                    <p>The ethnicity of the users is not reported in any of the sources that we study; therefore, we created an ethnicity classifier similar to&#160;Mislove et al [<xref ref-type="bibr" rid="ref13">13</xref>]. The 2000 US census, which is the most recent available, reports the distribution of ethnicities for each last name (last names with fewer than 100 individuals were omitted) [<xref ref-type="bibr" rid="ref32">32</xref>]. For example, the distribution for Hernandez is reported as 4.55% white, 0.38% black, 0.27% Asian, and 93.81% Hispanic. We filtered this list to remove the last names with a frequency less than 1000, or where the discriminative probability of the majority ethnicity is less than 80%. We then use the ethnicity with the majority probability to classify ethnicity based on last name for sources that include the last name of users (Google+Health and TwitterHealth). We understand that race and ethnicity are not the same, especially when referring to Hispanics, but in this paper we try to simplify the presentation by only reporting ethnicity, that is, we do not distinguish groups like white Hispanic versus black Hispanic, but only Hispanic. For the other sources (health Web forums and drug review websites), which do not have user names, we found that using the screen name for ethnicity estimation is inaccurate, and hence we do not report on the ethnicity of these sources. Ethnicity labeling and classifier evaluation are reported in <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>.</p>
                </sec>
                <sec>
                    <title>Writing Level</title>
                    <p>Different methods and formulas for measuring readability are available using different factors such as average number of syllables per word, average number of words per sentence, or average number of letters per word. In our work, we used the Flesch-Kincaid Grade Level [<xref ref-type="bibr" rid="ref16">16</xref>] formula to estimate the writing level (values generally correspond to school grades 1-12) of the users:</p>
                    <p>Flesch-Kincaid Reading Age = (0.39 &#215; ASL) + (11.8 &#215; ASW) &#8211; 15.59, where ASL is the Average Sentence Length, and ASW is the Average number of Syllables per Word.</p>
                    <p>Note that since we can only observe the text authored by users, we measure the writing level and not the reading level; however, we use the reading level formula since no alternative formula for the writing level exists. The writing level of a user is computed using the above equation by concatenating all of the user&#8217;s posts and personal description. Links and hashtags from tweets are removed, and users with fewer than 100 words in total are ignored. We found that a very high reading level was being assigned to users who write very long incomprehensible sentences. This is a case that was not considered by the original Flesch-Kincaid reading age formula, which assumed that the text is grammatically and syntactically correct (eg, the text of a novel). For this reason, we omit sentences with more than 30 words.</p>
                </sec>
            </sec>
        </sec>
        <sec sec-type="results">
            <title>Results</title>
            <sec>
                <title>Overview</title>
                <p>To put our results in perspective, we compare them with other general demographics statistics. The population and Internet usage for each demographic group was obtained from the US census [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref30">30</xref>], while other statistics for Twitter and Google+ came from other sources [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref33">33</xref>-<xref ref-type="bibr" rid="ref35">35</xref>]. Further, we compare the demographics of the users participating in health-related discussions on Twitter and Google+ to the overall demographics of the users in these sites. All our results are statistically significant, except the comparison between health Web forums and drug review websites with respect to gender and age group (0-17). Also, there is no significant difference between Google+Health and drug review websites for age group (35-44).</p>
            </sec>
            <sec>
                <title>Gender</title>
                <p>As shown in <xref ref-type="table" rid="table3">Table 3</xref> [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref33">33</xref>], the gender distribution in the population and Internet usage is almost the same, and there is a slight difference for general social networks. Our first key finding is that drug review websites and health Web forums are dominated by female users; the number of female users is almost four times larger than that of male users. TwitterHealth and Google+Health have similar gender ratios when compared to the overall user base of Twitter and Google+.</p>
                <p>The finding that women use health forums much more than men is partially supported by previous research, which shows that women report ill health more frequently than men [<xref ref-type="bibr" rid="ref36">36</xref>]. In contrast, this is not true for Twitter and Google+, which are dominated by news exchanges [<xref ref-type="bibr" rid="ref37">37</xref>].</p>
                <table-wrap position="float" id="table3">
                    <label>Table 3</label>
                    <caption>
                        <p>Gender distribution for TwitterHealth, Google+Health, drug reviews, and health forums, compared to other relevant populations.</p>
                    </caption>
                    <table width="671" border="1" cellpadding="7" cellspacing="0" frame="below" rules="groups">
                        <col width="413" />
                        <col width="108" />
                        <col width="108" />
                        <thead>
                            <tr valign="top">
                                <td>Source</td>
                                <td>Females, %</td>
                                <td>Males, %</td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td>Population [<xref ref-type="bibr" rid="ref30">30</xref>]</td>
                                <td>51.05</td>
                                <td>48.95</td>
                            </tr>
                            <tr valign="top">
                                <td>Internet Use [<xref ref-type="bibr" rid="ref31">31</xref>]</td>
                                <td>51.63</td>
                                <td>48.37</td>
                            </tr>
                            <tr valign="top">
                                <td>General social networks [<xref ref-type="bibr" rid="ref11">11</xref>]</td>
                                <td>54.68</td>
                                <td>45.32</td>
                            </tr>
                            <tr valign="top">
                                <td>Twitter [<xref ref-type="bibr" rid="ref33">33</xref>]</td>
                                <td>57.00</td>
                                <td>43.00</td>
                            </tr>
                            <tr valign="top">
                                <td>Google+ [<xref ref-type="bibr" rid="ref33">33</xref>]</td>
                                <td>37.00</td>
                                <td>63.00</td>
                            </tr>
                            <tr valign="bottom">
                                <td>TwitterHealth<sup>a</sup>
                                </td>
                                <td>51.81</td>
                                <td>48.19</td>
                            </tr>
                            <tr valign="bottom">
                                <td>Google+Health<sup>a</sup>
                                </td>
                                <td>35.36</td>
                                <td>64.64</td>
                            </tr>
                            <tr valign="bottom">
                                <td>Drug review websites<sup>a</sup>
                                </td>
                                <td>78.48</td>
                                <td>21.52</td>
                            </tr>
                            <tr valign="bottom">
                                <td>Health Web forums<sup>a</sup>
                                </td>
                                <td>78.41</td>
                                <td>21.59</td>
                            </tr>
                        </tbody>
                    </table>
                    <table-wrap-foot>
                        <fn id="table3fn1">
                            <p>
                                <sup>a</sup>These results are from this work. Results in the rows above are reported in the respective citations.</p>
                        </fn>
                    </table-wrap-foot>
                </table-wrap>
            </sec>
            <sec>
                <title>Age</title>
                <p>
                    <xref ref-type="table" rid="table4">Table 4</xref> [<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref38">38</xref>] reports the age distribution of users in the studied social outlets and in other relevant sources, to put the results in perspective. Age groups were chosen based on the US census. We therefore understand that the age ranges are not equal, but since our main goal is comparing the demographics of Web-based health-related social outlets to other statistics such as Internet usage, we chose to follow the census age ranges in computer and Internet access. Further, we provide population distribution in <xref ref-type="table" rid="table4">Table 4</xref> to compare each group size with others. One-fifth of Internet users are in the group 0-17; this percentage drops to approximately 1% for drug review websites and health Web forums. The majority of users on drug review websites are between 45 and 64 years old, and drug reviews have more users over 65 years than any other source; this is expected as older patients use more medications [<xref ref-type="bibr" rid="ref39">39</xref>]. However, the percentage of drug review users above 65 is slightly lower than the percentage of Internet users over 65, which means that older people still have low participation in Health 2.0 sites. Also, the 18-34 age group dominates health Web forums, which is congruent with general social networks usage [<xref ref-type="bibr" rid="ref34">34</xref>]. To summarize, our second key finding is that the participants of health-related social outlets are generally older than those of general-purpose social forums, but still relatively low in the 65+ bracket. This is expected to change in the near future based on the participation statistics in the 45-64 bracket.</p>
                <table-wrap position="float" id="table4">
                    <label>Table 4</label>
                    <caption>
                        <p>Age distribution for Google+Health, drug reviews, health forums, and other relevant populations.</p>
                    </caption>
                    <table width="671" border="1" cellpadding="7" cellspacing="0" frame="below" rules="groups">
                        <col width="167" />
                        <col width="81" />
                        <col width="88" />
                        <col width="88" />
                        <col width="88" />
                        <col width="77" />
                        <thead>
                            <tr valign="top">
                                <td>Source</td>
                                <td>0-17 years, %</td>
                                <td>18-34 years, %</td>
                                <td>35-44 years, %</td>
                                <td>45-64 years, %</td>
                                <td>65+ years, %</td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td>Population [<xref ref-type="bibr" rid="ref30">30</xref>]</td>
                                <td>24.00</td>
                                <td>23.11</td>
                                <td>12.93</td>
                                <td>26.53</td>
                                <td>13.44</td>
                            </tr>
                            <tr valign="top">
                                <td>Internet use [<xref ref-type="bibr" rid="ref31">31</xref>]</td>
                                <td>19.30</td>
                                <td>27.55</td>
                                <td>14.99</td>
                                <td>28.36</td>
                                <td>9.80</td>
                            </tr>
                            <tr valign="top">
                                <td>General social networks [<xref ref-type="bibr" rid="ref34">34</xref>]</td>
                                <td>14.58</td>
                                <td>27.43</td>
                                <td>20.68</td>
                                <td>30.98</td>
                                <td>6.32</td>
                            </tr>
                            <tr valign="top">
                                <td>Google+ [<xref ref-type="bibr" rid="ref38">38</xref>]</td>
                                <td>8.08</td>
                                <td>71.61</td>
                                <td>11.08</td>
                                <td>7.82</td>
                                <td>1.42</td>
                            </tr>
                            <tr valign="bottom">
                                <td>Google+Health<sup>a</sup>
                                </td>
                                <td>3.42</td>
                                <td>53.21</td>
                                <td>21.89</td>
                                <td>19.02</td>
                                <td>2.46</td>
                            </tr>
                            <tr valign="bottom">
                                <td>Drug review websites<sup>a</sup>
                                </td>
                                <td>1.05</td>
                                <td>31.13</td>
                                <td>22.36</td>
                                <td>36.84</td>
                                <td>8.62</td>
                            </tr>
                            <tr valign="bottom">
                                <td>Health Web forums<sup>a</sup>
                                </td>
                                <td>1.03</td>
                                <td>39.80</td>
                                <td>25.81</td>
                                <td>28.95</td>
                                <td>4.41</td>
                            </tr>
                        </tbody>
                    </table>
                    <table-wrap-foot>
                        <fn id="table4fn1">
                            <p>
                                <sup>a</sup>These results are from this work. Results in the rows above are reported in the respective citations.</p>
                        </fn>
                    </table-wrap-foot>
                </table-wrap>
            </sec>
            <sec>
                <title>Ethnicity</title>
                <p>For the ethnicity and location analyses, we focus on the US population, in order to compare to available US census statistics. <xref ref-type="table" rid="table5">Table 5</xref> [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref41">41</xref>] shows the results of our ethnicity analysis. Recall that users&#8217; ethnicity in Google+Health and TwitterHealth is classified using our last name-based classifier. Our third key observation is that blacks are underrepresented in health-related social network discussions (Google+Health, TwitterHealth).</p>
                <table-wrap position="float" id="table5">
                    <label>Table 5</label>
                    <caption>
                        <p>Ethnicity distribution for TwitterHealth, Google+Health, and other relevant populations.</p>
                    </caption>
                    <table width="671" border="1" cellpadding="8" cellspacing="0" rules="groups" frame="hsides">
                        <col width="308" />
                        <col width="78" />
                        <col width="91" />
                        <col width="103" />
                        <col width="90" />
                        <thead>
                            <tr valign="top">
                                <td>Source</td>
                                <td>Asian, %</td>
                                <td>Black, %</td>
                                <td>Hispanic, %</td>
                                <td>White, %</td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td>Population [<xref ref-type="bibr" rid="ref40">40</xref>]</td>
                                <td>4.5</td>
                                <td>12.2</td>
                                <td>15.8</td>
                                <td>65.1</td>
                            </tr>
                            <tr valign="top">
                                <td>Internet use [<xref ref-type="bibr" rid="ref31">31</xref>]</td>
                                <td>5.5</td>
                                <td>11.7</td>
                                <td>13.9</td>
                                <td>67.2</td>
                            </tr>
                            <tr valign="top">
                                <td>General social networks [<xref ref-type="bibr" rid="ref12">12</xref>]</td>
                                <td>5.3</td>
                                <td>12.1</td>
                                <td>14.5</td>
                                <td>66.5</td>
                            </tr>
                            <tr valign="top">
                                <td>Twitter [<xref ref-type="bibr" rid="ref41">41</xref>]</td>
                                <td>N/A</td>
                                <td>9</td>
                                <td>12</td>
                                <td>71</td>
                            </tr>
                            <tr valign="bottom">
                                <td>TwitterHealth<sup>a</sup>
                                </td>
                                <td>3.24</td>
                                <td>0.3</td>
                                <td>23.5</td>
                                <td>73.0</td>
                            </tr>
                            <tr valign="bottom">
                                <td>Google+Health<sup>a</sup>
                                </td>
                                <td>5.6</td>
                                <td>0.3</td>
                                <td>17.4</td>
                                <td>76.6</td>
                            </tr>
                        </tbody>
                    </table>
                    <table-wrap-foot>
                        <fn id="table5fn1">
                            <p>
                                <sup>a</sup>These results are from this work. Results in the rows above are reported in the respective citations.</p>
                        </fn>
                    </table-wrap-foot>
                </table-wrap>
            </sec>
            <sec>
                <title>Location</title>
                <p>Location is reported in four sources: the two general social networks (TwitterHealth, Google+Health), one drug review website (DailyStrength/Treatments), and one health Web forum (DailyStrength/Forums); approximately 62% of users reported their locations. For TwitterHealth and Google+Health, users report their location using a single string (eg, &#8220;NY, NY&#8221;). Thus, these strings are further processed to obtain structured locations (eg, state: New York, city: New York). In particular, non-alphanumeric characters and extra spaces were removed, and location strings with a frequency less than 14 were removed. This left us with about 60% of TwitterHealth and Google+Health users with location strings. Each location string was mapped to a location (city, state, country) using the Google Geocoding API [<xref ref-type="bibr" rid="ref27">27</xref>]. We focus on US users, and hence we remove users from other countries. DailyStrength/Treatments and DailyStrength/Forums list the user&#8217;s city and state separately; thus, we use the reported state for these sources.</p>
                <p>In <xref ref-type="fig" rid="figure2">Figure 2</xref>, we show the distribution of users for each type of Web-based health-related social outlet, normalized by state population. Panel A shows the distribution of users in health Web forums, Panel B shows the distribution of users in drug review websites, Panel C shows the distribution of users in TwitterHealth, and Panel D shows the distribution of users in Google+Health.</p>
                <p>To better understand these results, we created <xref ref-type="table" rid="table6">Table 6</xref> [<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref42">42</xref>-<xref ref-type="bibr" rid="ref45">45</xref>], which shows the correlation across all states between the normalized (by population) number of users in various health-related social outlets and other societal measures (see <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref> for more details). Our fourth key finding is that users in areas with higher income and more access to health care are more likely to participate in Web-based health-related outlets, and particularly in Web forums and drug review sites, which are the primary social sites for health-related information sharing [<xref ref-type="bibr" rid="ref10">10</xref>]. Further, we see that in Twitter and Google+ the correlation with the number of physicians and education is higher. A reason could be that 59.1% of the 878,194 US active physicians [<xref ref-type="bibr" rid="ref42">42</xref>] participate in these networks [<xref ref-type="bibr" rid="ref46">46</xref>], which is a significant number, as the geolocated subsets of the Google+Health and TwitterHealth datasets contain only 882,207 users in the United States. The high correlation with education may be explained by the high percentage (91%) of Twitter users with a college degree or higher [<xref ref-type="bibr" rid="ref47">47</xref>].</p>
                <table-wrap position="float" id="table6">
                    <label>Table 6</label>
                    <caption>
                        <p>Correlation across all states between the normalized (per capita) number of users for each type of health-related social outlet, and each state&#8217;s population, normalized number of Internet users, normalized number of physicians, normalized number of uninsured patients, average annual income, and percentage of population with a college degree or higher.</p>
                    </caption>
                    <table width="671" border="1" cellpadding="7" cellspacing="0" frame="below" rules="groups">
                        <col width="228" />
                        <col width="65" />
                        <col width="71" />
                        <col width="80" />
                        <col width="90" />
                        <col width="53" />
                        <thead>
                            <tr valign="top">
                                <td>Correlation</td>
                                <td>Health Web forums</td>
                                <td>Drug review websites</td>
                                <td>TwitterHealth</td>
                                <td>Google+Health</td>
                                <td>Google+</td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td>Internet usage [<xref ref-type="bibr" rid="ref31">31</xref>]</td>
                                <td>0.19</td>
                                <td>0.28</td>
                                <td>0.01</td>
                                <td>-0.01</td>
                                <td>0.00</td>
                            </tr>
                            <tr valign="top">
                                <td>No. of physicians [<xref ref-type="bibr" rid="ref42">42</xref>]</td>
                                <td>0.37</td>
                                <td>0.19</td>
                                <td>0.88</td>
                                <td>0.80</td>
                                <td>0.44</td>
                            </tr>
                            <tr valign="top">
                                <td>Uninsured population [<xref ref-type="bibr" rid="ref43">43</xref>]</td>
                                <td>-0.40</td>
                                <td>-0.40</td>
                                <td>-0.17</td>
                                <td>-0.11</td>
                                <td>-0.10</td>
                            </tr>
                            <tr valign="top">
                                <td>Annual income [<xref ref-type="bibr" rid="ref44">44</xref>]</td>
                                <td>0.38</td>
                                <td>0.27</td>
                                <td>0.17</td>
                                <td>0.25</td>
                                <td>0.26</td>
                            </tr>
                            <tr valign="top">
                                <td>Education (ratio of people with a college degree) [<xref ref-type="bibr" rid="ref45">45</xref>]</td>
                                <td>0.35</td>
                                <td>0.22</td>
                                <td>0.56</td>
                                <td>0.63</td>
                                <td>0.54</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
                <fig id="figure2" position="float">
                    <label>Figure 2</label>
                    <caption>
                        <p>Per capita number of users by state in (A) health Web forums, (B) drug review websites, (C) TwitterHealth, and (D) Google+Health.</p>
                    </caption>
                    <graphic xlink:href="jmir_v17i8e194_fig2.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
            </sec>
            <sec>
                <title>Writing Level</title>
                <p>The writing level, as previously mentioned, is measured using a standard reading level formula that assigns a school grade to the given text. For example, when a person writes text at a 5<sup>th</sup> grade reading level, it implies that their writing should be understood by people that have passed the 5<sup>th</sup> grade. <xref ref-type="table" rid="table7">Table 7</xref> reports our results for writing level of health-related social outlet users. We see that Google+Health users generally have a higher writing level than users of the other sources, which may mean that more of the Google+Health users are professional accounts.</p>
                <p>Next, we try to put these findings in perspective. Unfortunately, related work reports only on reading levels (and not writing levels) of the US population participating in social outlets. Thus, we compare our results in <xref ref-type="table" rid="table7">Table 7</xref> to <xref ref-type="fig" rid="figure3">Figure 3</xref>, which reports the reading level of the general US population [<xref ref-type="bibr" rid="ref15">15</xref>].</p>
                <table-wrap position="float" id="table7">
                    <label>Table 7</label>
                    <caption>
                        <p>Writing level distribution for TwitterHealth, Google+Health, drug reviews, and health forums.</p>
                    </caption>
                    <table width="671" border="1" cellpadding="7" cellspacing="0" frame="below" rules="groups">
                        <col width="283" />
                        <col width="108" />
                        <col width="108" />
                        <col width="116" />
                        <thead>
                            <tr valign="top">
                                <td>Source</td>
                                <td>Age 0-5, %</td>
                                <td>Age 6-9, %</td>
                                <td>Age 10-16, %</td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td>TwitterHealth</td>
                                <td>37.77</td>
                                <td>51.09</td>
                                <td>11.13</td>
                            </tr>
                            <tr valign="top">
                                <td>Google+Health</td>
                                <td>6.45</td>
                                <td>55.63</td>
                                <td>37.91</td>
                            </tr>
                            <tr valign="top">
                                <td>Drug review websites</td>
                                <td>30.42</td>
                                <td>66.17</td>
                                <td>3.41</td>
                            </tr>
                            <tr valign="top">
                                <td>Health Web forums</td>
                                <td>28.79</td>
                                <td>68.24</td>
                                <td>2.98</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
                <p>Our fifth key finding is that the writing level in health-related social outlets (<xref ref-type="table" rid="table7">Table 7</xref>) is generally lower than the reading level of the population (<xref ref-type="fig" rid="figure3">Figure 3</xref>). Thus users/patients can easily comprehend the posts and hence benefit from the experiences of other users. The benefit of social interaction with respect to health empowerment has been demonstrated before [<xref ref-type="bibr" rid="ref48">48</xref>]. In an online epilepsy community, 59% of patients found another patient experiencing the same symptoms, 58% had a better understanding of seizures, and 55% learned more about treatments and symptoms.</p>
                <fig id="figure3" position="float">
                    <label>Figure 3</label>
                    <caption>
                        <p>Reading level of US population.</p>
                    </caption>
                    <graphic xlink:href="jmir_v17i8e194_fig3.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
            </sec>
            <sec>
                <title>Statistical Significance Tests</title>
                <p>
                    <xref ref-type="table" rid="table8">Tables 8</xref> and <xref ref-type="table" rid="table9">9</xref> report the <italic>P</italic> values for Pearson&#8217;s chi-square test of independence and the Mann-Whitney U test. Note that we compute only significance values between sources that we have analyzed and not between our sources and sources analyzed by other works (such as Google+ [<xref ref-type="bibr" rid="ref38">38</xref>]), since we do not have the raw data for those sources.</p>
                <table-wrap position="float" id="table8">
                    <label>Table 8</label>
                    <caption>
                        <p>
                            <italic>P</italic> values for Pearson&#8217;s chi-square test of independence.</p>
                    </caption>
                    <table width="671" border="1" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                        <col width="180" />
                        <col width="90" />
                        <col width="90" />
                        <col width="90" />
                        <col width="90" />
                        <thead>
                            <tr valign="top">
                                <td>
                                    <break />
                                </td>
                                <td>Gender</td>
                                <td>Age</td>
                                <td>Ethnicity</td>
                                <td>Writing level</td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td>TwitterHealth vs Google+Health</td>
                                <td>&#60;.001</td>
                                <td>N/A</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                            </tr>
                            <tr valign="top">
                                <td>TwitterHealth vs Health Web forums</td>
                                <td>&#60;.001</td>
                                <td>N/A</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                            </tr>
                            <tr valign="top">
                                <td>TwitterHealth vs Drug review websites</td>
                                <td>&#60;.001</td>
                                <td>N/A</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                            </tr>
                            <tr valign="top">
                                <td>Google+Health vs Health Web forums</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                            </tr>
                            <tr valign="top">
                                <td>Google+Health vs Drug review websites</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                            </tr>
                            <tr valign="top">
                                <td>Health Web forums vs Drug review websites</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
                <table-wrap position="float" id="table9">
                    <label>Table 9</label>
                    <caption>
                        <p>
                            <italic>P</italic> values for Mann-Whitney U test.</p>
                    </caption>
                    <table width="671" border="1" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                        <col width="10" />
                        <col width="60" />
                        <col width="80" />
                        <col width="82" />
                        <col width="83" />
                        <col width="89" />
                        <col width="90" />
                        <col width="68" />
                        <thead>
                            <tr valign="top">
                                <td colspan="2">
                                    <break />
                                </td>
                                <td>TwitterHealth vs Google+Health</td>
                                <td>TwitterHealth vs Health Web forums</td>
                                <td>TwitterHealth vs Drug review websites</td>
                                <td>Google+Health vs Health Web forums</td>
                                <td>Google+Health vs Drug review websites</td>
                                <td>Health Web forums vs Drug review websites</td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td colspan="8">
                                    <bold>Gender</bold>
                                </td>
                            </tr>
                            <tr valign="top">
                                <td>
                                    <break />
                                </td>
                                <td>Male</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>.5797</td>
                            </tr>
                            <tr valign="top">
                                <td>
                                    <break />
                                </td>
                                <td>Female</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>.5797</td>
                            </tr>
                            <tr valign="top">
                                <td colspan="8">
                                    <bold>Age</bold>
                                </td>
                            </tr>
                            <tr valign="top">
                                <td>
                                    <break />
                                </td>
                                <td>0-17</td>
                                <td>N/A</td>
                                <td>N/A</td>
                                <td>N/A</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>.5144</td>
                            </tr>
                            <tr valign="top">
                                <td>
                                    <break />
                                </td>
                                <td>18-34</td>
                                <td>N/A</td>
                                <td>N/A</td>
                                <td>N/A</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                            </tr>
                            <tr valign="top">
                                <td>
                                    <break />
                                </td>
                                <td>35-44</td>
                                <td>N/A</td>
                                <td>N/A</td>
                                <td>N/A</td>
                                <td>.01661</td>
                                <td>.7747</td>
                                <td>&#60;.001</td>
                            </tr>
                            <tr valign="top">
                                <td>
                                    <break />
                                </td>
                                <td>45-64</td>
                                <td>N/A</td>
                                <td>N/A</td>
                                <td>N/A</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                            </tr>
                            <tr valign="top">
                                <td>
                                    <break />
                                </td>
                                <td>&#8805;65</td>
                                <td>N/A</td>
                                <td>N/A</td>
                                <td>N/A</td>
                                <td>.01066</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                            </tr>
                            <tr valign="top">
                                <td colspan="8">
                                    <bold>Ethnicity</bold>
                                </td>
                            </tr>
                            <tr valign="top">
                                <td>
                                    <break />
                                </td>
                                <td>White</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>.1316</td>
                            </tr>
                            <tr valign="top">
                                <td>
                                    <break />
                                </td>
                                <td>Black</td>
                                <td>.6339</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>.0944</td>
                            </tr>
                            <tr valign="top">
                                <td>
                                    <break />
                                </td>
                                <td>Asian</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>&#60;.01</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>.8054</td>
                            </tr>
                            <tr valign="top">
                                <td>
                                    <break />
                                </td>
                                <td>Hispanic</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>.6503</td>
                            </tr>
                            <tr valign="top">
                                <td colspan="8">
                                    <bold>Writing level</bold>
                                </td>
                            </tr>
                            <tr valign="top">
                                <td>
                                    <break />
                                </td>
                                <td>0-5</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                            </tr>
                            <tr valign="top">
                                <td>
                                    <break />
                                </td>
                                <td>6-9</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                            </tr>
                            <tr valign="top">
                                <td>
                                    <break />
                                </td>
                                <td>10-16</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>&#60;.001</td>
                                <td>.00516</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
            </sec>
        </sec>
        <sec sec-type="discussion">
            <title>Discussion</title>
            <sec>
                <title>Principal Findings</title>
                <p>Our results can help health care providers customize educational campaigns for different groups. For example, white women should be informed to a larger extent on the possible misinformation spreading in health Web forums, since they participate much more.</p>
                <p>Regarding mitigating ethnicity-based health care disparities, we found that Twitter and Google+ are more effective in reaching out to Hispanics about health care offerings. However, this is not true for black users, who are not overrepresented in any health-related social outlet. This means that there is no single outlet to reach the black population, which has been shown to receive worse health care by about 40% compared with the white population [<xref ref-type="bibr" rid="ref49">49</xref>].</p>
                <p>Advertisers may use our results to decide on the best sites to advertise their products; for instance, drug review websites are more appropriate than Google+ to advertise drugs for the 45-64 age bracket, but the opposite is true for the 18-34 age bracket. Further, drug review websites and health Web forums are better to target females when advertising for their products than other health-related social outlets.</p>
                <p>In the age results section, we found that younger groups (18-34 years old) participate in large numbers in health forums, which may sound counterintuitive. By analyzing posts for this age bracket, we found the most popular keywords are related to pregnancy such as birth control, ovulation, and miscarriage. On the other hand, their participation is lower for drug review websites. A possible explanation may be that often patients who talk about pregnancy are not taking any drugs, compared to other conditions like diabetes, where drugs are more common.</p>
                <p>We also attempt to explain the disparities in the participation in health-related social outlets based on socioeconomic factors through the state-level participation distributions. Our results in <xref ref-type="table" rid="table6">Table 6</xref> show that less access to physicians does not lead to higher participation in health-related social outlets as one would expect. In contrast, it seems that the participation in such outlets is correlated with the access to health care and the average income.</p>
                <p>The weak but positive correlation between income and participation in health Web forums and drug review sites may be partially attributed to the higher Internet usage of the more affluent groups, as shown in <xref ref-type="table" rid="table6">Table 6</xref>. Another possible explanation is that lower income or uninsured persons are more likely to be part of a community with health care disparities [<xref ref-type="bibr" rid="ref50">50</xref>]. The positive correlation between education and participation in health-related social outlets, especially Google+Health and TwitterHealth, may be partially explained by the fact that people with college degrees are less likely to be uninsured, since 10% of college graduates are uninsured, compared to 40% of adults who have not graduated from high school [<xref ref-type="bibr" rid="ref51">51</xref>]. In addition, 60% of uninsured people are from families with low incomes [<xref ref-type="bibr" rid="ref51">51</xref>], and the group of people with income lower than US $30K is the lowest group in terms of accessing health information [<xref ref-type="bibr" rid="ref52">52</xref>]. Hence, our results show that people with low income have less access to health information.</p>
                <p>On the other hand, we found that the content in health-related social outlets is easy to understand for almost all users, given the low writing level. That is, the well-known health literacy issue, which is more severe in low-income and lower education populations [<xref ref-type="bibr" rid="ref5">5</xref>], does not seem to apply to Web-based health-related social outlets. Of course, the low writing level does not address the issue of language, as many low-income and low-education users in the United States do not speak English at home [<xref ref-type="bibr" rid="ref53">53</xref>].</p>
            </sec>
            <sec>
                <title>Limitations</title>
                <p>Our ethnicity and gender classifiers are not perfect, as shown in <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>, and thus introduce an error into our analyses. This issue is less significant for gender, since out of all users included in our gender analysis for health Web forums and drug review websites, a majority of the users (over 94%) report their gender, and hence the classifier was only used for 6% of users. Further, a majority of users in drug review websites and health Web forums are female, and our gender classifier obtained an accuracy greater than 99% for females when using a screen name.</p>
                <p>Another limitation is the informal writing style of social media posts, as our writing level method uses the average sentence length, which expects that posts are properly punctuated. We addressed this limitation to some degree by only considering sentences of a reasonable length (less than 30 words). Estimating writing level could have been improved by considering other features like typos or spelling mistakes. Further, it would be useful to measure the quality of the posted information, in addition to just the writing level. This is a challenging issue, which we leave as future work.</p>
                <p>Since all the attributes are reported by users, there is inevitably self-selection bias. In particular, gender, age, and location are not mandatory in any site. For instance, older people may choose not to report their age. Moreover, choosing to report the real names or posting profile pictures could also create self-selection bias in our gender and ethnicity classifiers. There may also be various types or degrees of bias across different outlets. For instance, WebMD users may use their real name less frequently than Twitter users. This in turn may bias the study results, especially for ethnicity where we depend completely on the classifier results.</p>
            </sec>
            <sec>
                <title>Conclusion</title>
                <p>We studied user demographics in Web-based health-related social outlets, which we split into three different types: social networks, drug review websites, and health Web forums. The distributions of the demographic attributes&#8212;gender, age, ethnicity, location, and writing level&#8212;have been analyzed for each source type and compared with relevant baseline user distributions like Internet and general social outlets participation. The results reveal interesting and often unexpected disparities with respect to all demographic attributes.</p>
            </sec>
        </sec>
    </body>
    <back>
        <app-group>
            <app id="app1">
                <title>Multimedia Appendix 1</title>
                <p>Online social outlets summary, health keywords, classifiers evaluation, and data coverage.</p>
                <media xlink:href="jmir_v17i8e194_app1.pdf" xlink:title="PDF File (Adobe PDF File), 36KB" />
            </app>
        </app-group>
        <glossary>
            <title>Abbreviations</title>
            <def-list>
                <def-item>
                    <term id="abb1">API</term>
                    <def>
                        <p>application programming interface</p>
                    </def>
                </def-item>
            </def-list>
        </glossary>
        <ack>
            <p>This project was partially supported by National Science Foundation (NSF) grants IIS-1216007, IIS-1447826, and IIP-1448848. Any opinions, findings and conclusions or recommendations expressed in this material are those of the authors and do not necessarily reflect the views of the National Science Foundation (NSF).</p>
        </ack>
        <fn-group>
            <fn fn-type="con">
                <p>All authors contributed substantially to this work. They designed and performed the analysis and approved the final version of this manuscript.</p>
            </fn>
            <fn fn-type="conflict">
                <p>None declared.</p>
            </fn>
        </fn-group>
        <ref-list>
            <ref id="ref1">
                <label>1</label>
                <nlm-citation citation-type="web">
                    <source>ECRI</source>
                    <year>2011</year>
                    <access-date>2015-02-02</access-date>
                    <comment>Social media in healthcare <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://kcmsociety.org/wp-content/uploads/2013/04/ECRI-social-media.pdf">http://kcmsociety.org/wp-content/uploads/2013/04/ECRI-social-media.pdf</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6W1rk2Yt2</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref2">
                <label>2</label>
                <nlm-citation citation-type="web">
                    <source>Giving benefits the YouTube treatment - workplace benefits association</source>
                    <year>2008</year>
                    <access-date>2015-01-31</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.workplacebenefits.org/news/giving-benefits-youtube-treatment-711171-1.html">http://www.workplacebenefits.org/news/giving-benefits-youtube-treatment-711171-1.html</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6Vyr2D7tA</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref3">
                <label>3</label>
                <nlm-citation citation-type="web">
                    <source>Health Disparities</source>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.medicaid.gov/Medicaid-CHIP-Program-Information/By-Topics/Data-and-Systems/Health-Disparities.html">http://www.medicaid.gov/Medicaid-CHIP-Program-Information/By-Topics/Data-and-Systems/Health-Disparities.html</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6W1rr2Maq</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref4">
                <label>4</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Frieden</surname>
                            <given-names>TR</given-names>
                        </name>
                        <collab>Centers for Disease Control and Prevention (CDC)</collab>
                    </person-group>
                    <article-title>Forward: CDC Health Disparities and Inequalities Report - United States, 2011</article-title>
                    <source>MMWR Surveill Summ</source>
                    <year>2011</year>
                    <month>01</month>
                    <day>14</day>
                    <volume>60 Suppl</volume>
                    <fpage>1</fpage>
                    <lpage>2</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.cdc.gov/mmwr/preview/mmwrhtml/su6001a1.htm" />
                    </comment>
                    <pub-id pub-id-type="medline">21430612</pub-id>
                    <pub-id pub-id-type="pii">su6001a1</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref5">
                <label>5</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Gibbons</surname>
                            <given-names>MC</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Fleisher</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Slamon</surname>
                            <given-names>RE</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Bass</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kandadai</surname>
                            <given-names>V</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Beck</surname>
                            <given-names>JR</given-names>
                        </name>
                    </person-group>
                    <article-title>Exploring the potential of Web 2.0 to address health disparities</article-title>
                    <source>J Health Commun</source>
                    <year>2011</year>
                    <volume>16 Suppl 1</volume>
                    <fpage>77</fpage>
                    <lpage>89</lpage>
                    <pub-id pub-id-type="doi">10.1080/10810730.2011.596916</pub-id>
                    <pub-id pub-id-type="medline">21843097</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref6">
                <label>6</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Kane</surname>
                            <given-names>GC</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Fichman</surname>
                            <given-names>RG</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Gallaugher</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Glaser</surname>
                            <given-names>J</given-names>
                        </name>
                    </person-group>
                    <article-title>Community relations 2.0</article-title>
                    <source>Harv Bus Rev</source>
                    <year>2009</year>
                    <month>11</month>
                    <volume>87</volume>
                    <issue>11</issue>
                    <fpage>45</fpage>
                    <lpage>50, 132</lpage>
                    <pub-id pub-id-type="medline">19891388</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref7">
                <label>7</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Hackworth</surname>
                            <given-names>B</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kunz</surname>
                            <given-names>M</given-names>
                        </name>
                    </person-group>
                    <article-title>Health care and social media: building relationships via social networks</article-title>
                    <source>Acad Heal Care J</source>
                    <year>2010</year>
                    <volume>6</volume>
                    <issue>1</issue>
                    <fpage>55</fpage>
                    <lpage>69</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.thefreelibrary.com/403.htm" />
                    </comment>
                </nlm-citation>
            </ref>
            <ref id="ref8">
                <label>8</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Denecke</surname>
                            <given-names>K</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Nejdl</surname>
                            <given-names>W</given-names>
                        </name>
                    </person-group>
                    <article-title>How valuable is medical social media data? Content analysis of the medical web</article-title>
                    <source>Information Sciences</source>
                    <year>2009</year>
                    <month>05</month>
                    <day>30</day>
                    <volume>179</volume>
                    <issue>12</issue>
                    <fpage>1870</fpage>
                    <lpage>1880</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.ins.2009.01.025</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref9">
                <label>9</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Lu</surname>
                            <given-names>Y</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Zhang</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Liu</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Li</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Deng</surname>
                            <given-names>S</given-names>
                        </name>
                    </person-group>
                    <article-title>Health-related hot topic detection in online communities using text clustering</article-title>
                    <source>PLoS One</source>
                    <year>2013</year>
                    <volume>8</volume>
                    <issue>2</issue>
                    <fpage>e56221</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0056221" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1371/journal.pone.0056221</pub-id>
                    <pub-id pub-id-type="medline">23457530</pub-id>
                    <pub-id pub-id-type="pii">PONE-D-12-27785</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3574139</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref10">
                <label>10</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Wiley</surname>
                            <given-names>MT</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Jin</surname>
                            <given-names>C</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hristidis</surname>
                            <given-names>V</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Esterling</surname>
                            <given-names>KM</given-names>
                        </name>
                    </person-group>
                    <article-title>Pharmaceutical drugs chatter on Online Social Networks</article-title>
                    <source>J Biomed Inform</source>
                    <year>2014</year>
                    <month>06</month>
                    <volume>49</volume>
                    <fpage>245</fpage>
                    <lpage>54</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://linkinghub.elsevier.com/retrieve/pii/S1532-0464(14)00063-X" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1016/j.jbi.2014.03.006</pub-id>
                    <pub-id pub-id-type="medline">24637141</pub-id>
                    <pub-id pub-id-type="pii">S1532-0464(14)00063-X</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref11">
                <label>11</label>
                <nlm-citation citation-type="web">
                    <source>Pew Research Center&#8217;s Internet &#38; American Life Project</source>
                    <comment>Social Networking Fact Sheet<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.pewinternet.org/fact-sheets/social-networking-fact-sheet/">http://www.pewinternet.org/fact-sheets/social-networking-fact-sheet/</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6W22L3O2w</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref12">
                <label>12</label>
                <nlm-citation citation-type="web">
                    <source>eMarketer</source>
                    <year>2013</year>
                    <access-date>2015-02-02</access-date>
                    <comment>Health care and social media: building relationships via social networks<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.emarketer.com/Article/Hispanic-Shoppers-Bring-Social-Mobile-Habits-Grocery-Aisle/1009839">http://www.emarketer.com/Article/Hispanic-Shoppers-Bring-Social-Mobile-Habits-Grocery-Aisle/1009839</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6W21kTHSr</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref13">
                <label>13</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Mislove</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lehmann</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ahn</surname>
                            <given-names>Y</given-names>
                        </name>
                    </person-group>
                    <source>AAAI</source>
                    <year>2011</year>
                    <access-date>2015-06-14</access-date>
                    <comment>Understanding the demographics of Twitter users<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.ccs.neu.edu/home/amislove/publications/Twitter-ICWSM.pdf">http://www.ccs.neu.edu/home/amislove/publications/Twitter-ICWSM.pdf</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6ZHoYQIfV</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref14">
                <label>14</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Mandel</surname>
                            <given-names>B</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Culotta</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Boulahanis</surname>
                            <given-names>J</given-names>
                        </name>
                    </person-group>
                    <article-title>A demographic analysis of online sentiment during Hurricane Irene</article-title>
                    <source>Language in Social Media</source>
                    <year>2012</year>
                    <fpage>27</fpage>
                    <lpage>36</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://dl.acm.org/citation.cfm?id=2390378" />
                    </comment>
                </nlm-citation>
            </ref>
            <ref id="ref15">
                <label>15</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <collab>Harvard</collab>
                    </person-group>
                    <source>The literacy problem</source>
                    <access-date>2015-06-14</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://cdn1.sph.harvard.edu/wp-content/uploads/sites/135/2012/09/doakchap1-4.pdf">http://cdn1.sph.harvard.edu/wp-content/uploads/sites/135/2012/09/doakchap1-4.pdf</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6ZHoudAjI</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref16">
                <label>16</label>
                <nlm-citation citation-type="web">
                    <source>Twitter, Inc</source>
                    <access-date>2015-08-01</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://twitter.com/">https://twitter.com/</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6aTENJsel</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref17">
                <label>17</label>
                <nlm-citation citation-type="web">
                    <source>Google+</source>
                    <access-date>2015-08-01</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://accounts.google.com/ServiceLogin?service=oz&#38;passive=1209600&#38;continue=https://plus.google.com/?gpsrc%3Dgplp0">https://accounts.google.com/ServiceLogin?service=oz&#38;passive=1209600&#38;continue=https://plus.google.com/?gpsrc%3Dgplp0</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6aTEQOvFn</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref18">
                <label>18</label>
                <nlm-citation citation-type="web">
                    <source>Drugs.com</source>
                    <access-date>2015-02-02</access-date>
                    <comment>Prescription Drug Information, Interactions &#38; Side Effects<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.drugs.com/">http://www.drugs.com/</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6W23lHwlt</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref19">
                <label>19</label>
                <nlm-citation citation-type="web">
                    <source>DailyStrength</source>
                    <access-date>2015-02-02</access-date>
                    <comment>Treatments: reviews of drugs, therapies and remedies by everyday people<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.dailystrength.org/treatments">http://www.dailystrength.org/treatments</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6W23nXoJa</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref20">
                <label>20</label>
                <nlm-citation citation-type="web">
                    <source>WebMD Drugs &#38; Treatments - Medical Information and user ratings on prescription drugs and over-the-counter (OTC) medications</source>
                    <access-date>2015-02-02</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.webmd.com/drugs/index-drugs.aspx">http://www.webmd.com/drugs/index-drugs.aspx</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6W23rKUfB</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref21">
                <label>21</label>
                <nlm-citation citation-type="web">
                    <source>Drugs.com</source>
                    <access-date>2015-02-02</access-date>
                    <comment>Medical Questions Answered<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.drugs.com/answers/">http://www.drugs.com/answers/</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6W23vDAi5</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref22">
                <label>22</label>
                <nlm-citation citation-type="web">
                    <source>DailyStrength</source>
                    <access-date>2015-02-02</access-date>
                    <comment>Online Support Groups<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.dailystrength.org/support-groups">http://www.dailystrength.org/support-groups</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6W23ztpRe</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref23">
                <label>23</label>
                <nlm-citation citation-type="web">
                    <source>WebMD - Better information</source>
                    <access-date>2015-02-02</access-date>
                    <comment>Better health<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.webmd.com/">http://www.webmd.com/</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6W247u0HQ</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref24">
                <label>24</label>
                <nlm-citation citation-type="web">
                    <source>The Flesch grade level readability formula</source>
                    <access-date>2015-02-02</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.readabilityformulas.com/flesch-grade-level-readability-formula.php">http://www.readabilityformulas.com/flesch-grade-level-readability-formula.php</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6W22mEB3h</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref25">
                <label>25</label>
                <nlm-citation citation-type="web">
                    <source>RxList - The Internet Drug Index for prescription drugs, medications and pill identifier</source>
                    <access-date>2015-02-02</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.rxlist.com/script/main/hp.asp">http://www.rxlist.com/script/main/hp.asp</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6W24Layfl</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref26">
                <label>26</label>
                <nlm-citation citation-type="web">
                    <source>The Streaming APIs &#124; Twitter Developers</source>
                    <access-date>2015-06-14</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://dev.twitter.com/streaming/overview">https://dev.twitter.com/streaming/overview</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6ZHpD7gjO</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref27">
                <label>27</label>
                <nlm-citation citation-type="web">
                    <source>Google+ API - Google+ Platform &#8212; Google Developers</source>
                    <access-date>2015-02-02</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://developers.google.com/+/api/">https://developers.google.com/+/api/</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6W24x2YYc</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref28">
                <label>28</label>
                <nlm-citation citation-type="web">
                    <source>jsoup Java HTML Parser, with best of DOM, CSS, and jquery</source>
                    <access-date>2015-02-02</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://jsoup.org/">http://jsoup.org/</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6W2528eFu</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref29">
                <label>29</label>
                <nlm-citation citation-type="web">
                    <source>Top names over the last 100 years</source>
                    <access-date>2015-02-02</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.ssa.gov/oact/babynames/decades/century.html">http://www.ssa.gov/oact/babynames/decades/century.html</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6W25cpwBx</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref30">
                <label>30</label>
                <nlm-citation citation-type="web">
                    <source>U.S. Census Bureau Demographic Internet Staff</source>
                    <year>2012</year>
                    <access-date>2015-02-02</access-date>
                    <comment>Age and sex composition in the United States<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://www.census.gov/population/age/data/2012comp.html">https://www.census.gov/population/age/data/2012comp.html</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6W25iCZh0</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref31">
                <label>31</label>
                <nlm-citation citation-type="web">
                    <source>U.S. Census Bureau Demographic Internet Staff</source>
                    <year>2012</year>
                    <access-date>2015-02-02</access-date>
                    <comment>Computer and internet access in the United States<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://www.census.gov/hhes/computer/publications/2012.html">https://www.census.gov/hhes/computer/publications/2012.html</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6W271RtOB</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref32">
                <label>32</label>
                <nlm-citation citation-type="web">
                    <source>US Census Bureau Data Integration Division</source>
                    <access-date>2015-02-02</access-date>
                    <comment>Genealogy Data - Frequently occurring surnames from Census 2000 - US Census Bureau<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.census.gov/topics/population/genealogy/data/2000_surnames.html">http://www.census.gov/topics/population/genealogy/data/2000_surnames.html</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6W27P3i6N</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref33">
                <label>33</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Smith</surname>
                            <given-names>C</given-names>
                        </name>
                    </person-group>
                    <source>User demographics of the major social networks</source>
                    <year>2012</year>
                    <access-date>2015-02-02</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://expandedramblings.com/index.php/user-demographics-of-the-major-social-networks-infographic/">http://expandedramblings.com/index.php/user-demographics-of-the-major-social-networks-infographic/</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6W27uwrNE</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref34">
                <label>34</label>
                <nlm-citation citation-type="web">
                    <source>April 2011: The Days of Double-Digit Growth in Social Network Users Are Over</source>
                    <access-date>2015-02-02</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.iab.net/research/industry_data_and_landscape/1675/1644724">http://www.iab.net/research/industry_data_and_landscape/1675/1644724</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6W284mBJz</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref35">
                <label>35</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Finn</surname>
                            <given-names>G</given-names>
                        </name>
                    </person-group>
                    <source>Behind The Numbers Of Google+&#039;s Monumental Rise To 25 Million Visitors</source>
                    <year>2011</year>
                    <access-date>2015-02-02</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://searchengineland.com/behind-the-numbers-of-googles-monumental-rise-to-25-million-unique-visitor-88076">http://searchengineland.com/behind-the-numbers-of-googles-monumental-rise-to-25-million-unique-visitor-88076</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6W28agd5M</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref36">
                <label>36</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Ashley</surname>
                            <given-names>J</given-names>
                        </name>
                    </person-group>
                    <source>BBC News - Women more likely to report ill health than men</source>
                    <year>2010</year>
                    <access-date>2015-02-02</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://news.bbc.co.uk/2/hi/health/8588686.stm">http://news.bbc.co.uk/2/hi/health/8588686.stm</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6W28nDUGK</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref37">
                <label>37</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Kwak</surname>
                            <given-names>H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lee</surname>
                            <given-names>C</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Park</surname>
                            <given-names>H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Moon</surname>
                            <given-names>S</given-names>
                        </name>
                    </person-group>
                    <article-title>What is Twitter, a Social Network or a News Media?</article-title>
                    <source>ACM</source>
                    <year>2010</year>
                    <month>04</month>
                    <fpage>591</fpage>
                    <lpage>600</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.ambuehler.ethz.ch/CDstore/www2010/www/p591.pdf" />
                    </comment>
                </nlm-citation>
            </ref>
            <ref id="ref38">
                <label>38</label>
                <nlm-citation citation-type="web">
                    <source>The comprehensive resource for Google+ trends and statistics</source>
                    <access-date>2015-02-02</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.gplusdata.com/users/sign_in">http://www.gplusdata.com/users/sign_in</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6W29H2CHP</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref39">
                <label>39</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Gu</surname>
                            <given-names>Q</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Dillon</surname>
                            <given-names>CF</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Burt</surname>
                            <given-names>VL</given-names>
                        </name>
                    </person-group>
                    <article-title>Prescription drug use continues to increase: U.S. prescription drug data for 2007-2008</article-title>
                    <source>NCHS Data Brief</source>
                    <year>2010</year>
                    <month>09</month>
                    <issue>42</issue>
                    <fpage>1</fpage>
                    <lpage>8</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.cdc.gov/nchs/data/databriefs/db42.pdf" />
                    </comment>
                    <pub-id pub-id-type="medline">20854747</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref40">
                <label>40</label>
                <nlm-citation citation-type="web">
                    <source>US Census Bureau</source>
                    <year>2012</year>
                    <access-date>2015-02-01</access-date>
                    <comment>Statistical abstract of the United States - Section 1<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.census.gov/prod/2011pubs/12statab/pop.pdf">http://www.census.gov/prod/2011pubs/12statab/pop.pdf</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6W29OSGmX</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref41">
                <label>41</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Bennett</surname>
                            <given-names>S</given-names>
                        </name>
                    </person-group>
                    <source>Twitter, Facebook and LinkedIn: age, ethnicity and gender of the major social networks</source>
                    <year>2011</year>
                    <access-date>2015-02-02</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.adweek.com/socialtimes/pew-social-network-age-ethnicity-gender/453165?red=at">http://www.adweek.com/socialtimes/pew-social-network-age-ethnicity-gender/453165?red=at</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6W2A8l2Cu</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref42">
                <label>42</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Young</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Chaudhry</surname>
                            <given-names>H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Thomas</surname>
                            <given-names>JV</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Dugan</surname>
                            <given-names>M</given-names>
                        </name>
                    </person-group>
                    <article-title>A census of actively licensed physicians in the United States</article-title>
                    <source>J Med Regul</source>
                    <year>2012</year>
                    <volume>99</volume>
                    <fpage>11</fpage>
                    <lpage>24</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://www.fsmb.org/Media/Default/PDF/Census/census.pdf" />
                    </comment>
                </nlm-citation>
            </ref>
            <ref id="ref43">
                <label>43</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>DeNavas-Walt</surname>
                            <given-names>C</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Proctor</surname>
                            <given-names>B</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Smith</surname>
                            <given-names>J</given-names>
                        </name>
                    </person-group>
                    <source>US Census Bureau, Current Population Reports</source>
                    <year>2013</year>
                    <access-date>2015-02-02</access-date>
                    <publisher-loc>Washington, DC</publisher-loc>
                    <comment>Income, poverty, and health insurance coverage in the United States<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.census.gov/prod/2013pubs/p60-245.pdf">http://www.census.gov/prod/2013pubs/p60-245.pdf</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6W2D1eglk</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref44">
                <label>44</label>
                <nlm-citation citation-type="web">
                    <source>US Census Bureau Data Integration Division</source>
                    <access-date>2015-02-02</access-date>
                    <comment>Income<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.census.gov/hhes/www/income/data/statemedian/">http://www.census.gov/hhes/www/income/data/statemedian/</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6W2D9aO6n</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref45">
                <label>45</label>
                <nlm-citation citation-type="web">
                    <source>US Census Bureau</source>
                    <year>2012</year>
                    <access-date>2015-02-02</access-date>
                    <comment>Statistical abstract of the United States - Section 4<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.census.gov/prod/2011pubs/12statab/educ.pdf">http://www.census.gov/prod/2011pubs/12statab/educ.pdf</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6W2DHYzQJ</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref46">
                <label>46</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Cooper</surname>
                            <given-names>CP</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Gelb</surname>
                            <given-names>CA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Rim</surname>
                            <given-names>SH</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hawkins</surname>
                            <given-names>NA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Rodriguez</surname>
                            <given-names>JL</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Polonec</surname>
                            <given-names>L</given-names>
                        </name>
                    </person-group>
                    <article-title>Physicians who use social media and other internet-based communication technologies</article-title>
                    <source>J Am Med Inform Assoc</source>
                    <year>2012</year>
                    <volume>19</volume>
                    <issue>6</issue>
                    <fpage>960</fpage>
                    <lpage>964</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://jamia.oxfordjournals.org/cgi/pmidlookup?view=long&#38;pmid=22634078" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1136/amiajnl-2011-000628</pub-id>
                    <pub-id pub-id-type="medline">22634078</pub-id>
                    <pub-id pub-id-type="pii">amiajnl-2011-000628</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3534450</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref47">
                <label>47</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Hampton</surname>
                            <given-names>KN</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Goulet</surname>
                            <given-names>LS</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Rainie</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Purcell</surname>
                            <given-names>K</given-names>
                        </name>
                    </person-group>
                    <source>Pew Research Center&#8217;s Internet &#38; American Life Project</source>
                    <year>2011</year>
                    <month>06</month>
                    <day>16</day>
                    <access-date>2015-08-01</access-date>
                    <comment>Social networking sites and our lives<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.pewinternet.org/2011/06/16/social-networking-sites-and-our-lives/">http://www.pewinternet.org/2011/06/16/social-networking-sites-and-our-lives/</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6aTEsGHIL</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref48">
                <label>48</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Wicks</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Keininger</surname>
                            <given-names>DL</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Massagli</surname>
                            <given-names>MP</given-names>
                        </name>
                        <name name-style="western">
                            <surname>de la Loge</surname>
                            <given-names>Christine</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Brownstein</surname>
                            <given-names>C</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Isoj&#228;rvi</surname>
                            <given-names>Jouko</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Heywood</surname>
                            <given-names>J</given-names>
                        </name>
                    </person-group>
                    <article-title>Perceived benefits of sharing health data between people with epilepsy on an online platform</article-title>
                    <source>Epilepsy Behav</source>
                    <year>2012</year>
                    <month>01</month>
                    <volume>23</volume>
                    <issue>1</issue>
                    <fpage>16</fpage>
                    <lpage>23</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://linkinghub.elsevier.com/retrieve/pii/S1525-5050(11)00560-9" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1016/j.yebeh.2011.09.026</pub-id>
                    <pub-id pub-id-type="medline">22099528</pub-id>
                    <pub-id pub-id-type="pii">S1525-5050(11)00560-9</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref49">
                <label>49</label>
                <nlm-citation citation-type="web">
                    <source>Agency for Healthcare Research &#38; Quality (AHRQ)</source>
                    <year>2014</year>
                    <access-date>2015-06-14</access-date>
                    <comment>Disparities in healthcare quality among racial and ethnic minority groups<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.ahrq.gov/research/findings/nhqrdr/nhqrdr10/minority.html">http://www.ahrq.gov/research/findings/nhqrdr/nhqrdr10/minority.html</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6ZHq5iyFV</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref50">
                <label>50</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Mendes</surname>
                            <given-names>E</given-names>
                        </name>
                    </person-group>
                    <source>Gallup poll</source>
                    <year>2010</year>
                    <access-date>2015-02-02</access-date>
                    <comment>In US, health disparities across incomes are wide-ranging<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.gallup.com/poll/143696/health-disparities-across-incomes-wide-ranging.aspx">http://www.gallup.com/poll/143696/health-disparities-across-incomes-wide-ranging.aspx</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6W2E9gDMj</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref51">
                <label>51</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Adler</surname>
                            <given-names>N</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Newman</surname>
                            <given-names>K</given-names>
                        </name>
                    </person-group>
                    <article-title>Socioeconomic disparities in health: pathways and policies</article-title>
                    <source>Health Aff (Millwood)</source>
                    <year>2002</year>
                    <month>03</month>
                    <day>01</day>
                    <volume>21</volume>
                    <issue>2</issue>
                    <fpage>60</fpage>
                    <lpage>76</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://content.healthaffairs.org/content/21/2/60.short" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1377/hlthaff.21.2.60</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref52">
                <label>52</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Madden</surname>
                            <given-names>M</given-names>
                        </name>
                    </person-group>
                    <source>Pew Research Center</source>
                    <year>2013</year>
                    <access-date>2015-06-14</access-date>
                    <comment>Technology use by different income groups<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.pewinternet.org/2013/05/29/technology-use-by-different-income-groups/">http://www.pewinternet.org/2013/05/29/technology-use-by-different-income-groups/</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6ZHs8GsTY</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref53">
                <label>53</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Ryan</surname>
                            <given-names>C</given-names>
                        </name>
                    </person-group>
                    <source>US Census Bureau</source>
                    <year>2013</year>
                    <access-date>2015-02-01</access-date>
                    <comment>Language use in the United States<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.census.gov/prod/2013pubs/acs-22.pdf">http://www.census.gov/prod/2013pubs/acs-22.pdf</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6W2EHGxIj</pub-id>
                </nlm-citation>
            </ref>
        </ref-list>
    </back>
</article>
