<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
    <front>
        <journal-meta>
            <journal-id journal-id-type="publisher-id">JMIR</journal-id>
            <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
            <journal-title>Journal of Medical Internet Research</journal-title>
            <issn pub-type="epub">1438-8871</issn>
            <publisher>
                <publisher-name>Gunther Eysenbach</publisher-name>
                <publisher-loc>Centre for Global eHealth Innovation, Toronto, Canada</publisher-loc>
            </publisher>
        </journal-meta>
        <article-meta>
            <article-id pub-id-type="publisher-id">v7i3e36</article-id>
            <article-id pub-id-type="pmid">15998627</article-id>
            <article-id pub-id-type="doi">10.2196/jmir.7.3.e36</article-id>
            <article-categories>
                <subj-group subj-group-type="article-type">
                    <subject>Original Paper</subject>
                </subj-group>
            </article-categories>
            <title-group>
                <article-title>Cancer Internet Search Activity on a Major Search Engine, United States 2001-2003</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author" id="contrib1">
                    <name name-style="western">
                        <surname>Cooper</surname>
                        <given-names>Crystale Purvis</given-names>
                    </name>
                    <degrees>PhD</degrees>
                    <xref ref-type="aff" rid="aff1">1</xref>
                </contrib>
                <contrib contrib-type="author" id="contrib2">
                    <name name-style="western">
                        <surname>Mallon</surname>
                        <given-names>Kenneth P</given-names>
                    </name>
                    <degrees>MS</degrees>
                    <degrees>MHS</degrees>
                    <xref ref-type="aff" rid="aff2">2</xref>
                </contrib>
                <contrib contrib-type="author" id="contrib3">
                    <name name-style="western">
                        <surname>Leadbetter</surname>
                        <given-names>Steven</given-names>
                    </name>
                    <degrees>MS</degrees>
                    <xref ref-type="aff" rid="aff1">1</xref>
                </contrib>
                <contrib contrib-type="author" id="contrib4" corresp="yes">
                    <name name-style="western">
                        <surname>Pollack</surname>
                        <given-names>Lori A</given-names>
                    </name>
                    <degrees>MD</degrees>
                    <degrees>MPH</degrees>
                    <xref ref-type="aff" rid="aff1">1</xref>
                    <address>
                        <institution>Centers for Disease Control and Prevention</institution>
                        <addr-line>4770 Buford Hwy, NE, MS K-55</addr-line>
                        <addr-line>Atlanta, GA 30341</addr-line>
                        <country>USA</country>
                        <phone>+1 770 457 3181</phone>
                        <fax>+1 770 488 4639</fax>
                        <email>lpollack@cdc.gov</email>
                    </address>
                </contrib>
                <contrib contrib-type="author" id="contrib5">
                    <name name-style="western">
                        <surname>Peipins</surname>
                        <given-names>Lucy A</given-names>
                    </name>
                    <degrees>PhD</degrees>
                    <xref ref-type="aff" rid="aff1">1</xref>
                </contrib>
            </contrib-group>
            <contrib-group>
                <contrib contrib-type="reviewer">
                    <name>
                        <surname>Jansen</surname>
                        <given-names>Jim</given-names>
                    </name>
                </contrib>
            </contrib-group>
            <aff id="aff2" rid="aff2">
                <sup>2</sup>
                <institution>Yahoo! Inc (at the time of this study)</institution>
                <institution>Dynamic Logic (at present)</institution>
            </aff>
            <aff id="aff1" rid="aff1">
                <sup>1</sup>
                <addr-line>Division of Cancer Prevention and Control</addr-line>
                <institution>National Center for Chronic Disease Prevention and Health Promotion</institution>
                <institution>Centers for Disease Control and Prevention</institution>
                <addr-line>Atlanta</addr-line>
                <addr-line>GA</addr-line>
                <country>USA</country>
            </aff>
            <pub-date pub-type="collection">
                <season>Jul-Aug</season>
                <year>2005</year>
            </pub-date>
            <pub-date pub-type="epub">
                <day>1</day>
                <month>7</month>
                <year>2005</year>
            </pub-date>
            <volume>7</volume>
            <issue>3</issue>
            <elocation-id>e36</elocation-id>
            <history>
                <date date-type="received">
                    <day>29</day>
                    <month>4</month>
                    <year>2005</year>
                </date>
                <date date-type="rev-request">
                    <day>18</day>
                    <month>5</month>
                    <year>2005</year>
                </date>
                <date date-type="rev-recd">
                    <day>7</day>
                    <month>6</month>
                    <year>2005</year>
                </date>
                <date date-type="accepted">
                    <day>12</day>
                    <month>6</month>
                    <year>2005</year>
                </date>
            </history>
            <copyright-statement>&#xA9; Crystale Purvis Cooper, Kenneth P Mallon, Steven Leadbetter, Lori A Pollack, Lucy A Peipins.  Originally published in the Journal of Medical Internet Research (http://www.jmir.org), 1.7.2005.  Except where otherwise noted, articles published in the Journal of Medical Internet Research are distributed under the terms of the Creative Commons Attribution License (http://www.creativecommons.org/licenses/by/2.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited, including full bibliographic details and the URL (see "please cite as" above), and this statement is included.</copyright-statement>
            <copyright-year>2005</copyright-year>
            <self-uri xlink:type="simple" xlink:href="http://www.jmir.org/2005/3/e36/"/>
            <abstract>
                <sec sec-type="background">
                    <title>Background</title>
                    <p> To locate online health information, Internet users typically use a search engine, such as Yahoo! or Google. We studied Yahoo! search activity related to the 23 most common cancers in the United States.</p>
                </sec>
                <sec sec-type="objective">
                    <title>Objective</title>
                    <p> The objective was to test three potential correlates of Yahoo! cancer search activity&#x2014;estimated cancer incidence, estimated cancer mortality, and the volume of cancer news coverage&#x2014;and to study the periodicity of and peaks in Yahoo! cancer search activity.</p>
                </sec>
                <sec sec-type="methods">
                    <title>Methods</title>
                    <p> Yahoo! cancer search activity was obtained from a proprietary database called the Yahoo! Buzz Index. The American Cancer Society's estimates of cancer incidence and mortality were used. News reports associated with specific cancer types were identified using the LexisNexis &#x201C;US News&#x201D; database, which includes more than 400 national and regional newspapers and a variety of newswire services.</p>
                </sec>
                <sec sec-type="results">
                    <title>Results</title>
                    <p> The Yahoo! search activity associated with specific cancers correlated with their estimated incidence (Spearman rank correlation, &#x3C1; = 0.50, <italic>P</italic> = .015), estimated mortality (&#x3C1; = 0.66, <italic>P</italic> = .001), and volume of related news coverage (&#x3C1; = 0.88, <italic>P</italic> &lt; .001). Yahoo! cancer search activity tended to be higher on weekdays and during national cancer awareness months but lower during summer months; cancer news coverage also tended to follow these trends. Sharp increases in Yahoo! search activity scores from one day to the next appeared to be associated with increases in relevant news coverage.</p>
                </sec>
                <sec sec-type="conclusions">
                    <title>Conclusions</title>
                    <p> Media coverage appears to play a powerful role in prompting online searches for cancer information. Internet search activity offers an innovative tool for passive surveillance of health information&#x2013;seeking behavior.</p>
                </sec>
            </abstract>
            <kwd-group>
                <kwd>Internet</kwd>
                <kwd>neoplasms</kwd>
                <kwd>health education</kwd>
            </kwd-group>
        </article-meta>
    </front>
    <body>
        <sec sec-type="introduction">
            <title>Introduction</title>
            <p>Health care providers [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref3">3</xref>] and their patients [<xref ref-type="bibr" rid="ref4">4</xref>-<xref ref-type="bibr" rid="ref7">7</xref>] regularly search for health information online. Internet users generally begin looking for health information using a search engine [<xref ref-type="bibr" rid="ref8">8</xref>-<xref ref-type="bibr" rid="ref12">12</xref>], an Internet tool that searches for Web pages containing terms specified by users [<xref ref-type="bibr" rid="ref13">13</xref>]. In February 2004, Google and Yahoo! were the most popular search engines in the United States, with 38% and 32% of market share, respectively [<xref ref-type="bibr" rid="ref14">14</xref>].</p>
            <p>To date, few studies of Internet search activity related to health topics have been published. Most analyzed the proportion of health and non-health searches on various search engines and found that health searches constituted a small percentage of total searches [<xref ref-type="bibr" rid="ref15">15</xref>-<xref ref-type="bibr" rid="ref18">18</xref>]. This finding is not surprising given how infrequently Internet users search for health information compared with how often they look for news reports, product information, and other topics [<xref ref-type="bibr" rid="ref19">19</xref>]. In any case, a small percentage of total Internet searches translates into thousands of health searches each day [<xref ref-type="bibr" rid="ref16">16</xref>], and an estimated 95 million Americans have used the Internet at least once to search for health information [<xref ref-type="bibr" rid="ref20">20</xref>].</p>
            <p>Cancer appears to be a health topic of some interest to Internet users. Eysenbach and K&#xF6;hler [<xref ref-type="bibr" rid="ref16">16</xref>] found that searches for cancer information accounted for 5% of health-related searches on the search engine MetaCrawler. Phillipov and Phillips [<xref ref-type="bibr" rid="ref18">18</xref>] found that &#x201C;skin cancer&#x201D; was one of only 17 health-related search terms among the most popular 300 Internet keywords identified by Wordtracker, a private research company. Bader and Theofanos [<xref ref-type="bibr" rid="ref21">21</xref>] studied cancer searches conducted using the search engine AskJeeves during a 3-month period and found the most commonly searched cancers were digestive/gastrointestinal/bowel, breast, and skin. This study also compared the incidence of selected cancers with their associated search activity. While this relationship was not statistically tested, the authors observed that some rarer cancers constituted a higher proportion of total searches than their proportion of total cancer incidence. In addition, Bader and Theofanos, as well as Phillipov and Phillips, noted that media coverage appeared to prompt Internet searches for health topics, but they did not systematically investigate or test the relationship.</p>
            <p>The study reported here builds on this prior work by analyzing cancer-related searches conducted in the United States from 2001 to 2003 using the search engine Yahoo! Specifically, we investigated three potential correlates of Yahoo! cancer search activity&#x2014;estimated cancer incidence, estimated cancer mortality, and the volume of cancer news coverage. Cancers that afflicted more individuals, claimed more lives, and generated more news coverage were expected to be associated with more Internet search activity than other cancers, given the interest generated by relevance and publicity. In addition, we assessed the periodicity of Yahoo! cancer search activity and examined sharp increases in Yahoo! search activity related to specific cancer types.</p>
        </sec>
        <sec sec-type="methods">
            <title>Methods</title>
            <p>This analysis included three types of 2001&#x2013;2003 US data: Yahoo! cancer search activity, cancer burden (estimated incidence and mortality), and cancer news coverage. The study protocol was reviewed by the Institutional Review Board of the National Center for Chronic Disease Prevention and Health Promotion and was designated as &#x201C;research not involving human subjects.&#x201D;</p>
            <sec>
                <title>Yahoo! Cancer Search Activity</title>
                <p>During 2001 (the beginning of the study period), Yahoo! was the most popular US search engine, with a 49% market share; however, in 2003 (the end of the study period), Google surpassed Yahoo! as the leading US search engine [<xref ref-type="bibr" rid="ref22">22</xref>]. Yahoo! remains a widely used search engine; more than 45 million US Internet users conducted Yahoo! searches in February 2004 [<xref ref-type="bibr" rid="ref14">14</xref>].</p>
                <p>Yahoo! maintains a database of search activity called the Yahoo! Buzz Index [<xref ref-type="bibr" rid="ref23">23</xref>]. This index provides a search activity score for individual search terms&#x2014;the words or characters that users type into the Yahoo! search box. Each point of a Yahoo! Buzz Index score equals 0.001% of users searching Yahoo! during the time period of interest (day, week, or month). For example, if 250 out of a total of 1 million users searched for &#x201C;breast cancer&#x201D; on January 1, 2001, the Yahoo! &#x201C;breast cancer&#x201D; search activity score on this day would be 25 (250/1 million &#xD7; 100000). For a search term to register a search activity score, it must generate at least 50 searches during the time period for which the score is calculated. Yahoo! search activity generated by search terms can be segmented by country, US state, or selected US cities. This study used daily US Yahoo! search activity data from January 1, 2001 (the earliest date for which Yahoo! search activity data are available) to December 31, 2003. We limited our analysis to Yahoo! searches because at the time of this study no other Internet search engine offered a dataset like the Yahoo! Buzz Index, which provides search activity scores adjusted for the size of the population searching for online information.</p>
                <p>Yahoo! employs professional &#x201C;surfers&#x201D; or content indexers who manually classify Web pages into one of more than 2000 content categories, such as &#x201C;movies,&#x201D; &#x201C;footwear,&#x201D; &#x201C;astrology,&#x201D; or &#x201C;cancer or neoplasms.&#x201D; The Yahoo! Buzz Index classifies search terms in the same content category as the first Web page link that a user &#x201C;clicks&#x201D; or activates after conducting a search. For instance, if a user entered the search term &#x201C;colon&#x201D; and then clicked on a cancer website, &#x201C;colon&#x201D; would be classified as a &#x201C;cancer or neoplasms&#x201D; search term. If the user clicked on a grammar website, however, &#x201C;colon&#x201D; in that instance would be classified as an &#x201C;education&#x201D; search term. When a user does not click on a Web page link or when a user clicks on a Web page link that has not been classified, the Yahoo! Buzz Index categorizes the search term using a variety of algorithms that analyze recent content viewed by the user.</p>
                <p>To identify commonly used Internet search terms related to specific cancers, we reviewed the search terms classified in the &#x201C;cancer or neoplasms&#x201D; category of the Yahoo! Buzz Index, which generated at least 50 searches in any month from January 2001 to December 2003. This search strategy identified 76 unique search terms, of which 23 were included in the analysis (<xref ref-type="table" rid="table1">Table 1</xref>). The remaining 53 terms were discarded because they did not relate to a specific cancer or included non-English words. Discarded terms included drug names or treatment modalities, such as &#x201C;chemotherapy&#x201D; (n = 19); the names of organizations or events, such as &#x201C;Race for the Cure&#x201D; (n = 16); general cancer or anatomy terms, such as &#x201C;oncology&#x201D; (n = 11); names of celebrities, such as &#x201C;Gilda Radner&#x201D; (n = 5); and the carcinogen &#x201C;DES&#x201D; (n = 1). Also, &#x201C;leucemia&#x201D; (n = 1), the Spanish word for &#x201C;leukemia,&#x201D; was discarded because the Yahoo! Buzz Index does not consistently track foreign words, as it excludes search terms that contain non-English characters. For instance, the Yahoo! Buzz Index would not capture a search term with an accent mark, such as &#x201C;c&#xE1;ncer colorectal&#x201D; (Spanish for &#x201C;colorectal cancer&#x201D;).</p>
            </sec>
            <sec>
                <title>Cancer Burden</title>
                <p>The estimated incidence and mortality for 23 cancers during the study period were obtained from annual burden reports published by the American Cancer Society [<xref ref-type="bibr" rid="ref24">24</xref>-<xref ref-type="bibr" rid="ref26">26</xref>]. All cancers with at least 7500 new cases in 2001, 2002, or 2003 were included in the analysis (n = 23) whether or not they were associated with Yahoo! search activity.</p>
            </sec>
            <sec>
                <title>Cancer News Coverage</title>
                <p>News reports associated with specific cancer types were identified using the LexisNexis &#x201C;US News&#x201D; database, which includes more than 400 national and regional newspapers, such as the <italic>Wall Street Journal</italic> and the <italic>Baltimore Sun,</italic> and a variety of newswire services, such as the Associated Press and UPI (United Press International). News reports published from January 1, 2001, to December 31, 2003, related to specific cancer types were found by locating reports with the identified Yahoo! search activity terms (eg, &#x201C;breast cancer&#x201D;) in their headlines. In the case of cancers located in the esophagus and oral cavity, for which no Yahoo! search activity terms were associated, the terms &#x201C;esophageal cancer&#x201D; and &#x201C;oral cancer&#x201D; were used as the headline search terms.</p>
            </sec>
            <sec>
                <title>Analysis</title>
                <p>Descriptive statistics were calculated for the Yahoo! search activity score, estimated incidence, estimated mortality, and news coverage volume associated with the cancers included in the study. Spearman rank correlations were used to establish the consistency of these variables across the study period, and the data were aggregated. Next, the relationships between Yahoo! search activity and the potential correlates of interest were tested using Spearman rank correlations.</p>
                <p>The relationship between Yahoo! search activity and news coverage was further analyzed for the five cancers with the highest daily Yahoo! search activity. The number of news reports published each day was transformed into a categorical variable with four levels (0 news reports, 1&#x2013;2 news reports, 3&#x2013;4 news reports, and 5 or more news reports), and one-way analysis of variance (ANOVA) was used to compare mean daily Yahoo! search activity scores at increasing levels of news coverage. To detect possible periodicity effects, Yahoo! search activity data were visually inspected. Three possible periodicity effects were noted: a rise during weekdays (Monday&#x2013;Friday) compared with weekends; a rise during national cancer awareness months compared with other months; and a decline during summer months (June&#x2013;August) compared with other months. These possible effects were tested using <italic>t</italic> tests. Finally, the Yahoo! search activity associated with several cancers was marked by sharp increases of 100% or more from one day to the next. For these cancers, we identified the three highest peaks in 2003 Yahoo! search activity and investigated corresponding news events.</p>
            </sec>
        </sec>
        <sec sec-type="results">
            <title>Results</title>
            <p>We found Internet search terms generating Yahoo! search activity associated with 21 of the 23 cancers included in the study (<xref ref-type="table" rid="table1">Table 1</xref>). Of these, 19 cancers were associated with only one Yahoo! search term each. The 2 remaining cancers were associated with two search terms each: cancers of the brain (&#x201C;brain tumor&#x201D; and &#x201C;brain cancer&#x201D;) and multiple myeloma (&#x201C;multiple myeloma&#x201D; and &#x201C;myeloma&#x201D;). In these cases, the daily Yahoo! search activity scores associated with each term were summed into a composite score for these cancers.</p>
            <p>The highest mean daily Yahoo! search activity scores were generated by breast cancer (mean = 14.37), lung cancer (mean = 9.08), and leukemia (mean = 7.15). Cancers with the highest US 2001&#x2013;2003 incidences were breast (n = 611300), prostate (n = 608000), and lung (n = 510800). For cancer mortality, lung (n = 469500), colorectal (n = 170400), and breast (n = 120800) cancer were the leading causes of death. Breast cancer (n = 5840), leukemia (n = 2143), and prostate cancer (n = 1822) were associated with the most US news reports from 2001 to 2003. Some cancers, such as leukemia, ovarian, and testicular, appeared to be associated with more Internet search activity than their burden would dictate.</p>
            <p>Cancers were ranked by mean daily Yahoo! search activity score, estimated incidence, estimated mortality, and number of related news reports for each year in the study period (2001 to 2003). To explore the consistency of ranks over the study period within each variable, Spearman rank correlations were determined for each pair of years (2001 and 2002, 2002 and 2003, 2001 and 2003). We found statistically significant correlations (<italic>P</italic> &lt; .001) between all year pairs tested (data not shown). Because the ranks associated with these variables were highly consistent from 2001 to 2003, we aggregated the data across the study period.</p>
            <table-wrap position="float" id="table1">
                <label>Table 1</label>
                <caption>
                    <p>Mean daily Yahoo! search activity score (United States, 2001&#x2013;2003), estimated incidence, estimated mortality, and number of news reports, by cancer</p>
                </caption>
                <table border="1" cellpadding="7" cellspacing="0" frame="below" rules="groups" width="551">
                    <col width="75"/>
                    <col width="114"/>
                    <col width="0"/>
                    <col width="77"/>
                    <col width="0"/>
                    <col width="85"/>
                    <col width="0"/>
                    <col width="75"/>
                    <col width="0"/>
                    <col width="83"/>
                    <col width="0"/>
                    <thead>
                        <tr valign="top">
                            <td>
                                <bold>Cancer</bold>
                            </td>
                            <td colspan="2">
                                <bold>Yahoo! Search Terms</bold>
                            </td>
                            <td colspan="2">
                                <bold>Mean Daily Yahoo! Search Activity Score<xref ref-type="table-fn" rid="table1fn1">*</xref>
                                </bold>
                                <bold>(Rank)</bold>
                            </td>
                            <td>
                                <bold>Estimated</bold><break/>
                                <bold>Incidence</bold>
                                <bold>(Rank)</bold>
                            </td>
                            <td colspan="2">
                                <bold>Estimated</bold><break/>
                                <bold>Mortality</bold>
                                <bold>(Rank)</bold>
                            </td>
                            <td colspan="2">
                                <bold>Number of News</bold><break/>
                                <bold>Reports (Rank)</bold>
                            </td>
                            <td/>
                        </tr>
                    </thead>
                    <tbody>
                        <tr valign="top">
                            <td>Breast</td>
                            <td>&#x201C;breast cancer&#x201D;</td>
                            <td colspan="2">14.37 (1)</td>
                            <td colspan="3">611300 (1)</td>
                            <td colspan="2">120800 (3)</td>
                            <td colspan="2">5840 (1)</td>
                        </tr>
                        <tr valign="top">
                            <td>Lung</td>
                            <td>&#x201C;lung cancer&#x201D;</td>
                            <td colspan="2">9.08 (2)</td>
                            <td colspan="3">510800 (3)</td>
                            <td colspan="2">469500 (1)</td>
                            <td colspan="2">918 (5)</td>
                        </tr>
                        <tr valign="top">
                            <td>Leukemia</td>
                            <td>&#x201C;leukemia&#x201D;</td>
                            <td colspan="2">7.15 (3)</td>
                            <td colspan="3">92900 (10)</td>
                            <td colspan="2">65100 (7)</td>
                            <td colspan="2">2143 (2)</td>
                        </tr>
                        <tr valign="top">
                            <td>Colorectal</td>
                            <td>&#x201C;colon cancer&#x201D;</td>
                            <td colspan="2">7.08 (4)</td>
                            <td colspan="3">431200 (4)</td>
                            <td colspan="2">170400 (2)</td>
                            <td colspan="2">617 (6)</td>
                        </tr>
                        <tr valign="top">
                            <td>Prostate</td>
                            <td>&#x201C;prostate cancer&#x201D;</td>
                            <td colspan="2">6.13 (5)</td>
                            <td colspan="3">608000 (2)</td>
                            <td colspan="2">90600 (4)</td>
                            <td colspan="2">1822 (3)</td>
                        </tr>
                        <tr valign="top">
                            <td>Ovary</td>
                            <td>&#x201C;ovarian cancer&#x201D;</td>
                            <td colspan="2">3.71 (6)</td>
                            <td colspan="3">72100 (13)</td>
                            <td colspan="2">42100 (9)</td>
                            <td colspan="2">458 (8)</td>
                        </tr>
                        <tr valign="top">
                            <td>Lymphoma</td>
                            <td>&#x201C;lymphoma&#x201D;</td>
                            <td colspan="2">3.54 (7)</td>
                            <td colspan="3">185500 (5)</td>
                            <td colspan="2">78100 (6)</td>
                            <td colspan="2">480 (7)</td>
                        </tr>
                        <tr valign="top">
                            <td>Uterine, cervix</td>
                            <td>&#x201C;cervical cancer&#x201D;</td>
                            <td colspan="2">2.53 (8)</td>
                            <td colspan="3">38100 (20)</td>
                            <td colspan="2">12600 (19)</td>
                            <td colspan="2">392 (9)</td>
                        </tr>
                        <tr valign="top">
                            <td>Melanoma</td>
                            <td>&#x201C;melanoma&#x201D;</td>
                            <td colspan="2">2.25 (9)</td>
                            <td colspan="3">159200 (7)</td>
                            <td colspan="2">22800 (16)</td>
                            <td colspan="2">376 (10)</td>
                        </tr>
                        <tr valign="top">
                            <td>Brain</td>
                            <td>&#x201C;brain tumor&#x201D;<break/>&#x201C;brain cancer&#x201D;</td>
                            <td colspan="2">1.52 (10)</td>
                            <td colspan="3">52500 (16)</td>
                            <td colspan="2">39300 (10)</td>
                            <td colspan="2">925 (4)</td>
                        </tr>
                        <tr valign="top">
                            <td>Liver</td>
                            <td>&#x201C;liver cancer&#x201D;</td>
                            <td colspan="2">0.70 (11)</td>
                            <td colspan="3">50100 (17)</td>
                            <td colspan="2">42600 (8)</td>
                            <td colspan="2">110 (14)</td>
                        </tr>
                        <tr valign="top">
                            <td>Testis</td>
                            <td>&#x201C;testicular cancer&#x201D;</td>
                            <td colspan="2">0.62 (12)</td>
                            <td colspan="3">22300 (23)</td>
                            <td colspan="2">1200 (23)</td>
                            <td colspan="2">50 (17)</td>
                        </tr>
                        <tr valign="top">
                            <td>Pancreas</td>
                            <td>&#x201C;pancreatic cancer&#x201D;</td>
                            <td colspan="2">0.23 (13)</td>
                            <td colspan="3">90200 (11)</td>
                            <td colspan="2">88600 (5)</td>
                            <td colspan="2">185 (11)</td>
                        </tr>
                        <tr valign="top">
                            <td>Multiple myeloma</td>
                            <td>&#x201C;multiple myeloma&#x201D;<break/>&#x201C;myeloma&#x201D;</td>
                            <td colspan="2">0.11 (14)</td>
                            <td colspan="3">43600 (18)</td>
                            <td colspan="2">32900 (15)</td>
                            <td colspan="2">185 (11)</td>
                        </tr>
                        <tr valign="top">
                            <td>Stomach</td>
                            <td>&#x201C;stomach cancer&#x201D;</td>
                            <td colspan="2">0.08 (15)</td>
                            <td colspan="3">65700 (14)</td>
                            <td colspan="2">37300 (13)</td>
                            <td colspan="2">50 (17)</td>
                        </tr>
                        <tr valign="top">
                            <td>Uterine, corpus</td>
                            <td>&#x201C;uterine cancer&#x201D;</td>
                            <td colspan="2">0.012 (16)</td>
                            <td colspan="3">117700 (8)</td>
                            <td colspan="2">20000 (18)</td>
                            <td colspan="2">17 (22)</td>
                        </tr>
                        <tr valign="top">
                            <td>Larynx</td>
                            <td>&#x201C;throat cancer&#x201D;</td>
                            <td colspan="2">0.012 (16)</td>
                            <td colspan="3">28400 (21)</td>
                            <td colspan="2">11500 (21)</td>
                            <td colspan="2">30 (20)</td>
                        </tr>
                        <tr valign="top">
                            <td>Bladder</td>
                            <td>&#x201C;bladder cancer&#x201D;</td>
                            <td colspan="2">0.010 (18)</td>
                            <td colspan="3">168200 (6)</td>
                            <td colspan="2">37500 (12)</td>
                            <td colspan="2">118 (13)</td>
                        </tr>
                        <tr valign="top">
                            <td>Soft tissue</td>
                            <td>&#x201C;sarcoma&#x201D;</td>
                            <td colspan="2">0.009 (19)</td>
                            <td colspan="3">25300 (22)</td>
                            <td colspan="2">12200 (20)</td>
                            <td colspan="2">25 (21)</td>
                        </tr>
                        <tr valign="top">
                            <td>Thyroid</td>
                            <td>&#x201C;thyroid cancer&#x201D;</td>
                            <td colspan="2">0.002 (20)</td>
                            <td colspan="3">62200 (15)</td>
                            <td colspan="2">4000 (22)</td>
                            <td colspan="2">40 (19)</td>
                        </tr>
                        <tr valign="top">
                            <td>Kidney</td>
                            <td>&#x201C;kidney cancer&#x201D;</td>
                            <td colspan="2">0.001 (21)</td>
                            <td colspan="3">94500 (9)</td>
                            <td colspan="2">35600 (14)</td>
                            <td colspan="2">77 (15)</td>
                        </tr>
                        <tr valign="top">
                            <td>Oral cavity</td>
                            <td>-</td>
                            <td colspan="2">0.000 (22)</td>
                            <td colspan="3">86700 (12)</td>
                            <td colspan="2">22400 (17)</td>
                            <td colspan="2">69 (16)</td>
                        </tr>
                        <tr valign="top">
                            <td>Esophagus</td>
                            <td>-</td>
                            <td colspan="2">0.000 (22)</td>
                            <td colspan="3">40200 (19)</td>
                            <td colspan="2">38100 (11)</td>
                            <td colspan="2">13 (23)</td>
                        </tr>
                    </tbody>
                </table>
                <table-wrap-foot>
                    <fn id="table1fn1"><p><sup>*</sup> Each point of a Yahoo! search activity score equals 0.001% of the population searching Yahoo! on any day.</p>
                    </fn>
                </table-wrap-foot>
            </table-wrap>
            <sec>
                <title>Correlates of Yahoo! Cancer Search Activity</title>
                <p>We tested the relationships between variables by determining Spearman rank correlations between each pair. Statistically significant correlations were found between all variable pairs (<xref ref-type="table" rid="table2">Table 2</xref>).</p>
                <table-wrap position="float" id="table2">
                    <label>Table 2</label>
                    <caption>
                        <p>Spearman rank correlations between mean daily Yahoo! search activity score (United States, 2001&#x2013;2003), estimated incidence, estimated mortality, and number of news reports</p>
                    </caption>
                    <table border="1" cellpadding="7" cellspacing="0" frame="hsides" rules="groups" width="619">
                        <col width="196"/>
                        <col width="131"/>
                        <col width="118"/>
                        <col width="118"/>
                        <thead>
                            <tr valign="top">
                                <td/>
                                <td colspan="3" align="center">
                                    <bold>Spearman Rank Correlation<sup><xref ref-type="table-fn" rid="table2fn1">*</xref></sup>
                                    </bold>
                                </td>
                            </tr>
                            <tr valign="top">
                                <td/>
                                <td>
                                    <bold>Mean Daily Yahoo! Search Activity Score</bold>
                                </td>
                                <td>
                                    <bold>Estimated Incidence</bold>
                                </td>
                                <td>
                                    <bold>Estimated Mortality</bold>
                                </td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td>Number of news reports</td>
                                <td>.88<sup>
                                        <xref ref-type="table-fn" rid="table2fn2">&#x2020;</xref>
                                    </sup>
                                </td>
                                <td>.62<sup>
                                        <xref ref-type="table-fn" rid="table2fn3">&#x2021;</xref>
                                    </sup>
                                </td>
                                <td>.74<sup>
                                        <xref ref-type="table-fn" rid="table2fn2">&#x2020;</xref>
                                    </sup>
                                </td>
                            </tr>
                            <tr valign="top">
                                <td>Estimated mortality</td>
                                <td>.66<sup>
                                        <xref ref-type="table-fn" rid="table2fn2">&#x2020;</xref>
                                    </sup>
                                </td>
                                <td>.71<sup>
                                        <xref ref-type="table-fn" rid="table2fn2">&#x2020;</xref>
                                    </sup>
                                </td>
                                <td>-</td>
                            </tr>
                            <tr valign="top">
                                <td>Estimated incidence</td>
                                <td>.50<sup>
                                        <xref ref-type="table-fn" rid="table2fn4">&#xA7;</xref>
                                    </sup>
                                </td>
                                <td>-</td>
                                <td>-</td>
                            </tr>
                        </tbody>
                    </table>
                    <table-wrap-foot>
                        <fn id="table2fn1"><p><sup>*</sup> Spearman rank correlations were done on the rankings reported in <xref ref-type="table" rid="table1">Table 1</xref>.</p>
                        </fn>
                        <fn id="table2fn2"><p><sup>&#x2020;</sup> 
                                <italic>P</italic> &#x2264; .001</p>
                        </fn>
                        <fn id="table2fn3"><p><sup>&#x2021;</sup> 
                                <italic>P</italic> = .002</p>
                        </fn>
                        <fn id="table2fn4"><p><sup>&#xA7;</sup> 
                                <italic>P</italic> = .015</p>
                        </fn>
                    </table-wrap-foot>
                </table-wrap>
                <p>The relationship between Yahoo! search activity and its most statistically significant correlate&#x2014;news coverage&#x2014;was further analyzed for the five cancers with the highest daily Yahoo! search activity (breast, lung, leukemia, colorectal, and prostate). For these cancers, the number of news reports published each day was transformed into a categorical variable with four levels. The mean daily Yahoo! search activity at each level was compared using ANOVA, and all tests were statistically significant (<italic>P</italic> &#x2264; .001). For all five cancers, the mean daily search activity score was higher at each increasing level of news coverage (<xref ref-type="table" rid="table3">Table 3</xref>).</p>
                <table-wrap position="float" id="table3">
                    <label>Table 3</label>
                    <caption>
                        <p>Mean daily Yahoo! search activity score (United States, 2001&#x2013;2003), by number of news reports published daily and cancer</p>
                    </caption>
                    <table border="1" cellpadding="7" cellspacing="0" frame="hsides" rules="groups" width="576">
                        <col width="101"/>
                        <col width="101"/>
                        <col width="101"/>
                        <col width="101"/>
                        <col width="101"/>
                        <thead>
                            <tr valign="top">
                                <td rowspan="2">
                                    <break/>
                                    <break/>
                                    <bold>Cancer</bold>
                                </td>
                                <td colspan="4" align="center">
                                    <bold>Mean Daily Yahoo! Search Activity Score<sup>
                                            <xref ref-type="table-fn" rid="table3fn1">*</xref>
                                            <xref ref-type="table-fn" rid="table3fn2">&#x2020;</xref>
                                        </sup>
                                    </bold>
                                    <bold>(Number of News Reports)</bold>
                                </td>
                            </tr>
                            <tr valign="top">
                                <td>
                                    <bold>Days With</bold>
                                    <bold>0</bold><break/>
                                    <bold>News Reports</bold>
                                </td>
                                <td>
                                    <bold>Days With</bold>
                                    <bold>1&#x2013;2</bold><break/>
                                    <bold>News Reports</bold>
                                </td>
                                <td>
                                    <bold>Days With</bold>
                                    <bold>3&#x2013;4</bold><break/>
                                    <bold>News Reports</bold>
                                </td>
                                <td>
                                    <bold>Days With</bold>
                                    <bold>5+</bold><break/>
                                    <bold>News Reports</bold>
                                </td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td>Breast</td>
                                <td>10.09 (81)</td>
                                <td>11.49 (278)</td>
                                <td>13.36 (252)</td>
                                <td>17.27 (484)<break/>
                                </td>
                            </tr>
                            <tr valign="top">
                                <td>Lung</td>
                                <td>8.27 (633)</td>
                                <td>10.00 (362)</td>
                                <td>10.54 (71)</td>
                                <td>11.71 (29)<break/>
                                </td>
                            </tr>
                            <tr valign="top">
                                <td>Leukemia</td>
                                <td>6.89 (248)</td>
                                <td>7.07 (523)</td>
                                <td>7.18 (232)</td>
                                <td>8.26 (92)<break/>
                                </td>
                            </tr>
                            <tr valign="top">
                                <td>Colorectal</td>
                                <td>6.72 (739)</td>
                                <td>7.44 (297)</td>
                                <td>8.25 (43)</td>
                                <td>13.92 (16)<break/>
                                </td>
                            </tr>
                            <tr valign="top">
                                <td>Prostate</td>
                                <td>5.30 (390)</td>
                                <td>6.40 (467)</td>
                                <td>6.72 (150)</td>
                                <td>7.43 (88)<break/>
                                </td>
                            </tr>
                        </tbody>
                    </table>
                    <table-wrap-foot>
                        <fn id="table3fn1"><p><sup>*</sup> Each point of a Yahoo! search activity score equals 0.001% of the population searching Yahoo! on any day.</p>
                        </fn>
                        <fn id="table3fn2"><p><sup>&#x2020;</sup> ANOVA was used to compare the mean daily Yahoo! search activity at each level of news coverage. For all five cancer sites, a statistically significant difference (<italic>P</italic> &#x2264; .001) was found.</p>
                        </fn>
                    </table-wrap-foot>
                </table-wrap>
            </sec>
            <sec>
                <title>Periodicity of Yahoo! Cancer Search Activity and News Coverage</title>
                <p>Three possible periodicity effects were tested: a rise during weekdays (Monday&#x2013;Friday) compared with weekends; a rise during national cancer awareness months compared with other months; and a decline during summer months (June&#x2013;August) compared with other months. To test for these potential effects, we used the five cancers with the highest daily mean Yahoo! search activity scores (breast, lung, leukemia, colorectal, and prostate) (<xref ref-type="table" rid="table4">Table 4</xref>). For all five cancers tested, both mean daily Yahoo! search activity scores and mean daily news reports were higher Monday&#x2013;Friday than they were Saturday&#x2013;Sunday (<italic>P</italic> &lt; .001). Higher mean daily Yahoo! search activity scores were found for breast cancer (<italic>P</italic> &lt; .001), lung cancer (<italic>P</italic> &lt; .001), and colorectal cancer (<italic>P</italic> &lt; .001) during their respective national awareness months. The number of mean daily news reports related to breast cancer (<italic>P</italic> &lt; .001), colorectal cancer (<italic>P</italic> &lt; .001), and prostate cancer (<italic>P</italic> = .007) rose during their respective national awareness months. Mean daily Yahoo! search activity scores for breast cancer (<italic>P</italic> &lt; .001), lung cancer (<italic>P</italic> &lt; .001), and leukemia (<italic>P</italic> &lt; .001) were lower during the summer months than during the rest of the year. While mean daily news reports about breast cancer also decreased during the summer (<italic>P</italic> &lt; .001), mean daily news reports about prostate cancer rose (<italic>P</italic> = .01).</p>
                <table-wrap position="float" id="table4">
                    <label>Table 4</label>
                    <caption>
                        <p>Periodicity of mean daily Yahoo! search activity score (United States 2001&#x2013;2003) and mean daily number of news reports, by cancer</p>
                    </caption>
                    <table border="1" cellpadding="7" cellspacing="0" frame="hsides" rules="groups" width="859">
                        <colgroup>
                            <col width="65"/>
                            <col width="82"/>
                            <col width="70"/>
                            <col width="70"/>
                            <col width="46"/>
                            <col width="70"/>
                            <col width="70"/>
                            <col width="46"/>
                            <col width="58"/>
                            <col width="70"/>
                            <col width="58"/>
                        </colgroup>
                        <thead>
                            <tr valign="top">
                                <td>
                                    <bold>Cancer</bold>
                                </td>
                                <td/>
                                <td>
                                    <bold>Weekdays</bold>
                                </td>
                                <td>
                                    <bold>Weekends</bold>
                                </td>
                                <td>
                                    <bold>
                                        <italic>P</italic> value</bold>
                                </td>
                                <td>
                                    <bold>Awareness Month</bold>
                                </td>
                                <td>
                                    <bold>Non-Awareness Months</bold>
                                </td>
                                <td>
                                    <bold>
                                        <italic>P</italic> value</bold>
                                </td>
                                <td>
                                    <bold>Summer: June&#x2013;August</bold>
                                </td>
                                <td>
                                    <bold>Non-Summer</bold>
                                </td>
                                <td>
                                    <bold>
                                        <italic>P</italic> value</bold>
                                </td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td rowspan="2">Breast<break/>
                                </td>
                                <td>Mean Daily Yahoo! Search Activity Score<sup>
                                        <xref ref-type="table-fn" rid="table4fn1">*</xref>
                                    </sup>
                                </td>
                                <td>15.78</td>
                                <td>10.84</td>
                                <td>&lt; .001</td>
                                <td>26.33<break/>
                                </td>
                                <td>13.26</td>
                                <td>&lt; .001</td>
                                <td>10.78</td>
                                <td>15.58</td>
                                <td>&lt; .001</td>
                            </tr>
                            <tr valign="top">
                                <td>Mean Daily Number of News Reports</td>
                                <td>6.26</td>
                                <td>3.02</td>
                                <td>&lt; .001</td>
                                <td>15.30</td>
                                <td>4.41</td>
                                <td>&lt; .001</td>
                                <td>4.19</td>
                                <td>5.72</td>
                                <td>&lt; .001</td>
                            </tr>
                            <tr valign="top">
                                <td rowspan="2">Lung</td>
                                <td>Mean Daily Yahoo! Search Activity Score</td>
                                <td>10.31</td>
                                <td>6.00</td>
                                <td>&lt; .001</td>
                                <td>11.69<break/>
                                </td>
                                <td>8.84</td>
                                <td>&lt; .001</td>
                                <td>5.76</td>
                                <td>10.20</td>
                                <td>&lt; .001</td>
                            </tr>
                            <tr valign="top">
                                <td>Mean Daily Number of News Reports</td>
                                <td>1.03</td>
                                <td>0.37</td>
                                <td>&lt; .001</td>
                                <td>1.03</td>
                                <td>0.82</td>
                                <td>.226</td>
                                <td>0.70<break/>
                                </td>
                                <td>0.89</td>
                                <td>.086</td>
                            </tr>
                            <tr valign="top">
                                <td rowspan="2">Leukemia</td>
                                <td>Mean Daily Yahoo! Search Activity Score</td>
                                <td>8.13</td>
                                <td>4.70</td>
                                <td>&lt; .001</td>
                                <td>6.65<break/>
                                </td>
                                <td>7.20</td>
                                <td>.093</td>
                                <td>5.65</td>
                                <td>7.66</td>
                                <td>&lt; .001</td>
                            </tr>
                            <tr valign="top">
                                <td>Mean Daily Number of News Reports</td>
                                <td>2.20</td>
                                <td>1.34</td>
                                <td>&lt; .001</td>
                                <td>1.51</td>
                                <td>2.00</td>
                                <td>.036</td>
                                <td>1.88</td>
                                <td>1.98</td>
                                <td>.506</td>
                            </tr>
                            <tr valign="top">
                                <td rowspan="2">Colorectal</td>
                                <td>Mean Daily Yahoo! Search Activity Score</td>
                                <td>7.73</td>
                                <td>5.44</td>
                                <td>&lt; .001</td>
                                <td>10.46<break/>
                                </td>
                                <td>6.77</td>
                                <td>&lt; .001</td>
                                <td>6.83</td>
                                <td>7.17</td>
                                <td>.081</td>
                            </tr>
                            <tr valign="top">
                                <td>Mean Daily Number of News Reports</td>
                                <td>0.68</td>
                                <td>0.27</td>
                                <td>&lt; .001</td>
                                <td>1.55</td>
                                <td>0.47</td>
                                <td>&lt; .001</td>
                                <td>0.49</td>
                                <td>0.59</td>
                                <td>.214</td>
                            </tr>
                            <tr valign="top">
                                <td rowspan="2">Prostate</td>
                                <td>Mean Daily Yahoo! Search Activity Score</td>
                                <td>6.82</td>
                                <td>4.41</td>
                                <td>&lt; .001</td>
                                <td>5.68<break/>
                                </td>
                                <td>6.18</td>
                                <td>.044</td>
                                <td>6.14</td>
                                <td>6.13</td>
                                <td>.997</td>
                            </tr>
                            <tr valign="top">
                                <td>Mean Daily Number of News Reports</td>
                                <td>2.03</td>
                                <td>0.74</td>
                                <td>&lt; .001</td>
                                <td>2.39</td>
                                <td>1.60</td>
                                <td>.007</td>
                                <td>2.14</td>
                                <td>1.50</td>
                                <td>.010</td>
                            </tr>
                        </tbody>
                    </table>
                    <table-wrap-foot>
                        <fn id="table4fn1"><p><sup>*</sup> Each point of a Yahoo! search activity score equals 0.001% of the population searching Yahoo! on any day.</p>
                        </fn>
                    </table-wrap-foot>
                </table-wrap>
            </sec>
            <sec>
                <title>Peaks in Yahoo! Cancer Search Activity and News Coverage</title>
                <p>On several occasions, Yahoo! search activity scores associated with breast cancer, colon cancer, and prostate cancer were marked by sharp increases of 100% or more from one day to the next. We investigated news events that corresponded with the highest three spikes in 2003 Yahoo! search activity for these cancers. These peaks in &#x201C;breast cancer&#x201D; and &#x201C;colon cancer&#x201D; search activity all occurred during their respective national awareness months and appeared to be related to news coverage promoting the awareness months. The highest peak in &#x201C;prostate cancer&#x201D; search activity (22.34) occurred on July 17 after news reports of a study [<xref ref-type="bibr" rid="ref27">27</xref>] exploring the association between sexual behavior and prostate cancer risk (<xref ref-type="fig" rid="figure1">Figure 1</xref>). These news reports generally focused on the possible protective benefit of masturbation. This study was not covered widely by the US news media, but it generated substantial news coverage in Australia and filtered onto the Internet via chat rooms, message boards, and medical news Web pages. While there was no corresponding spike in &#x201C;masturbation&#x201D; search activity, there was a 117% increase in the search activity score (from 61.88 on July 16 to 133.08 on July 17) for &#x201C;masterbation,&#x201D; a common misspelling. The second highest spike in &#x201C;prostate cancer&#x201D; search activity (14.59) occurred on October 21 after news broke that Academy-Award-winning actor Robert DeNiro had been diagnosed with prostate cancer. This story was widely covered by the US news media, and a 277% increase in &#x201C;Robert DeNiro&#x201D; search activity was observed on the same date (from 15.87 on October 20 to 59.90 on October 21). 
The third highest peak in &#x201C;prostate cancer&#x201D; search activity (12.41) occurred on December 29, when a study linking obesity with increased prostate cancer risk [<xref ref-type="bibr" rid="ref28">28</xref>] was covered by several US news outlets. No corresponding rise in searches for the terms &#x201C;obesity,&#x201D; &#x201C;overweight,&#x201D; or &#x201C;weight loss&#x201D; was observed.</p>
                <p>
                    <fig position="float" id="figure1">
                        <label>Figure 1</label>
                        <caption>
                            <p>2003 US prostate cancer Yahoo! search activity (each point of a Yahoo! search activity score equals 0.001% of the population searching Yahoo! on any day)</p>
                        </caption>
                        <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" position="float" mimetype="image" alt-version="no" xlink:href="jmir_v7i3e36_fig1.jpg"/>
                    </fig>
                </p>
            </sec>
        </sec>
        <sec sec-type="discussion">
            <title>Discussion</title>
            <p>This study suggests that media coverage plays a powerful role in prompting online cancer information seeking. News coverage correlated significantly with Yahoo! search activity (<italic>P</italic> &lt; .001). Also, Yahoo! search activity was found to rise as news coverage increased, and sharp rises in search activity from one day to the next appeared to be associated with increases in relevant news coverage. This study also suggests that the Internet can rapidly disseminate health news: the highest spike in 2003 US &#x201C;prostate cancer&#x201D; Yahoo! search activity seemed to be generated largely by news coverage in Australia that rapidly filtered onto the Internet via chat rooms, message boards, and medical news Web pages. Thus, it is possible that a news story does not necessarily have to be covered by the US news media in order to generate US Internet search activity.</p>
            <p>News coverage volume also correlated with estimated cancer incidence (<italic>P</italic> = .015) and mortality (<italic>P</italic> &lt; .001). This is interesting because past studies [<xref ref-type="bibr" rid="ref29">29</xref>-<xref ref-type="bibr" rid="ref33">33</xref>] on this topic have not generated consistent findings, with most [<xref ref-type="bibr" rid="ref30">30</xref>-<xref ref-type="bibr" rid="ref32">32</xref>] finding no relationship between disease burden and news coverage volume. However, none of the past studies focused on cancer, and none used our method for identifying news reports. While the news coverage of specific cancers generally matched their burden, we noted that some cancers, such as leukemia, ovarian cancer, and testicular cancer, were associated with more Internet search activity than their burden would suggest. A similar observation was reported by Bader and Theofanos [<xref ref-type="bibr" rid="ref21">21</xref>], who suggested that this discrepancy may result from more searches being required to locate online information about less common cancers. The high correlation between cancer-specific news coverage and associated online search activity in the present study suggests another explanation: some cancers received a disproportionate share of news coverage relative to their incidence and mortality, and online search activity, often prompted by news coverage, reflects this imbalance.</p>
            <p>We detected several periodicity effects in US Yahoo! cancer search activity, which tended to be higher on weekdays and during national cancer awareness months but lower during the summer months. It should be noted that these observations are not artifacts of the size of the online population during these periods because Yahoo! search activity scores are based on the percentage, not the number, of total users. One explanation for these results is that the volume of cancer news coverage tended to follow these trends. It is also possible that users tend to search for online cancer information from school or work settings. As a result, Yahoo! cancer search activity would be expected to drop during weekends when people are at home and over the summer months when many students are out of school and many workers go on vacation.</p>
            <p>Although Yahoo! is a leading US Internet search engine, the extent to which the findings of this study can be generalized to other search engines is not known. Also, we were unable to discern the motivations of Yahoo! users searching for cancer information. For instance, news coverage of a breast cancer drug might be associated with an increase in &#x201C;breast cancer&#x201D; search activity. While the Yahoo! Buzz Index would detect this rise, it cannot tell how many searchers were breast cancer patients or family members and how many were investors interested in buying stock in the company developing the drug.</p>
            <p>Internet search activity offers an innovative tool for passive surveillance of health information&#x2013;seeking behavior. While our work focused on cancer, Internet search activity may be useful in gauging health information seeking related to other diseases. For example, the volume of Internet searches related to symptoms or conditions might be used to predict disease outbreaks (eg, influenza) or to assess mental health following a disaster. Researchers at the Centre for Global eHealth Innovation have begun to experiment with analyses of this type [<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref35">35</xref>]. The Yahoo! Buzz Index is unique among Internet search datasets because it provides search activity scores adjusted for the size of the population searching for online information, which has steadily grown each year [<xref ref-type="bibr" rid="ref19">19</xref>]. Perhaps in the future, other Internet search engines will offer databases similar to the Yahoo! Buzz Index, and research could be conducted using a combination of search engines.</p>
        </sec>
    </body>
    <back>
        <ack>
            <p>The Centers for Disease Control and Prevention funded all aspects of this study, including design; collection, management, analysis, and interpretation of the data; and preparation, review, and approval of the manuscript. Yahoo! Inc provided technical support as part of the purchase of a Yahoo! Buzz Index subscription. Use of trade names is for identification only and does not imply endorsement by the US Department of Health and Human Services.</p>
        </ack>
        <fn-group>
            <fn fn-type="conflict">
                
                <p>One of the authors, KP Mallon, was employed by Yahoo! Inc at the time of this study and owns Yahoo! corporate stock.</p>
            </fn>
        </fn-group>
        <ref-list>
            <ref id="ref1">
                <label>1</label>
                <nlm-citation citation-type="journal" xlink:type="simple">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Sigouin</surname>
                            <given-names>Christopher</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Jadad</surname>
                            <given-names>Alejandro R</given-names>
                        </name>
                    </person-group>
                    <article-title>Awareness of sources of peer-reviewed research evidence on the internet</article-title>
                    <source>JAMA</source>
                    <year>2002</year>
                    <month>6</month>
                    <day>5</day>
                    <volume>287</volume>
                    <issue>21</issue>
                    <fpage>2867</fpage>
                    <lpage>9</lpage>
                    <pub-id pub-id-type="pii">joc11825</pub-id>
                    <pub-id pub-id-type="medline">22035782</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref2">
                <label>2</label>
                <nlm-citation citation-type="journal" xlink:type="simple">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Jadad</surname>
                            <given-names>A R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sigouin</surname>
                            <given-names>C</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Cocking</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Booker</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Whelan</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Browman</surname>
                            <given-names>G</given-names>
                        </name>
                    </person-group>
                    <article-title>Internet use among physicians, nurses, and their patients</article-title>
                    <source>JAMA</source>
                    <year>2001</year>
                    <month>9</month>
                    <day>26</day>
                    <volume>286</volume>
                    <issue>12</issue>
                    <fpage>1451</fpage>
                    <lpage>2</lpage>
                    <pub-id pub-id-type="pii">jlt0926-4</pub-id>
                    <pub-id pub-id-type="medline">21457056</pub-id>
                    <pub-id pub-id-type="doi">10.1001/jama.286.12.1451</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref3">
                <label>3</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Casebeer</surname>
                            <given-names>L</given-names>
                        </name>
                        <name>
                            <surname>Bennett</surname>
                            <given-names>N</given-names>
                        </name>
                        <name>
                            <surname>Kristofco</surname>
                            <given-names>R</given-names>
                        </name>
                        <name>
                            <surname>Carillo</surname>
                            <given-names>A</given-names>
                        </name>
                        <name>
                            <surname>Centor</surname>
                            <given-names>R</given-names>
                        </name>
                    </person-group>
                    <article-title>Physician Internet medical information seeking and online continuing education use patterns</article-title>
                    <source>J Contin Educ Health Prof</source>
                    <year>2002</year>
                    <volume>22</volume>
                    <issue>1</issue>
                    <fpage>33</fpage>
                    <lpage>42</lpage>
                    <pub-id pub-id-type="doi">10.1002/chp.1340220105</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref4">
                <label>4</label>
                <nlm-citation citation-type="journal" xlink:type="simple">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Baker</surname>
                            <given-names>Laurence</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Wagner</surname>
                            <given-names>Todd H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Singer</surname>
                            <given-names>Sara</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Bundorf</surname>
                            <given-names>M Kate</given-names>
                        </name>
                    </person-group>
                    <article-title>Use of the Internet and e-mail for health care information: results from a national survey</article-title>
                    <source>JAMA</source>
                    <year>2003</year>
                    <month>5</month>
                    <day>14</day>
                    <volume>289</volume>
                    <issue>18</issue>
                    <fpage>2400</fpage>
                    <lpage>6</lpage>
                    <comment><ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://jama.ama-assn.org/cgi/pmidlookup?view=long&amp;pmid=12746364" ext-link-type="uri">http://jama.ama-assn.org/cgi/pmidlookup?view=long&amp;pmid=12746364</ext-link></comment>
                    <pub-id pub-id-type="doi">10.1001/jama.289.18.2400</pub-id>
                    <pub-id pub-id-type="pii">289/18/2400</pub-id>
                    <pub-id pub-id-type="medline">22631234</pub-id>
                    </nlm-citation>
            </ref>
            <ref id="ref5">
                <label>5</label>
                <nlm-citation citation-type="journal" xlink:type="simple">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Diaz</surname>
                            <given-names>Joseph A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Griffith</surname>
                            <given-names>Rebecca A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ng</surname>
                            <given-names>James J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Reinert</surname>
                            <given-names>Steven E</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Friedmann</surname>
                            <given-names>Peter D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Moulton</surname>
                            <given-names>Anne W</given-names>
                        </name>
                    </person-group>
                    <article-title>Patients' use of the Internet for medical information</article-title>
                    <source>J Gen Intern Med</source>
                    <year>2002</year>
                    <month>3</month>
                    <volume>17</volume>
                    <issue>3</issue>
                    <fpage>180</fpage>
                    <lpage>5</lpage>
                    <pub-id pub-id-type="pii">jgi10603</pub-id>
                    <pub-id pub-id-type="medline">21927189</pub-id>
                    <pub-id pub-id-type="doi">10.1046/j.1525-1497.2002.10603.x</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref6">
                <label>6</label>
                <nlm-citation citation-type="journal" xlink:type="simple">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Murray</surname>
                            <given-names>Elizabeth</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lo</surname>
                            <given-names>Bernard</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Pollack</surname>
                            <given-names>Lance</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Donelan</surname>
                            <given-names>Karen</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Catania</surname>
                            <given-names>Joe</given-names>
                        </name>
                        <name name-style="western">
                            <surname>White</surname>
                            <given-names>Martha</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Zapert</surname>
                            <given-names>Kinga</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Turner</surname>
                            <given-names>Rachel</given-names>
                        </name>
                    </person-group>
                    <article-title>The impact of health information on the internet on the physician-patient relationship: patient perceptions</article-title>
                    <source>Arch Intern Med</source>
                    <year>2003</year>
                    <month>7</month>
                    <day>28</day>
                    <volume>163</volume>
                    <issue>14</issue>
                    <fpage>1727</fpage>
                    <lpage>34</lpage>
                    <pub-id pub-id-type="doi">10.1001/archinte.163.14.1727</pub-id>
                    <pub-id pub-id-type="pii">163/14/1727</pub-id>
                    <pub-id pub-id-type="medline">22767590</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref7">
                <label>7</label>
                <nlm-citation citation-type="book">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Fox</surname>
                            <given-names>S</given-names>
                        </name>
                        <name>
                            <surname>Fallows</surname>
                            <given-names>D</given-names>
                        </name>
                    </person-group>
                    <source>Internet health resources: health searches and email have become more commonplace, but there is room for improvement in searches and overall Internet access</source>
                    <year>2003</year>
                    <publisher-loc>Washington, DC</publisher-loc>
                    <publisher-name>Pew Internet &amp; American Life Project</publisher-name>
                    <comment><ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.pewinternet.org/pdfs/PIP_Health_Report_July_2003.pdf" ext-link-type="uri">http://www.pewinternet.org/pdfs/PIP_Health_Report_July_2003.pdf</ext-link></comment>
                </nlm-citation>
            </ref>
            <ref id="ref8">
                <label>8</label>
                <nlm-citation citation-type="journal" xlink:type="simple">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Eysenbach</surname>
                            <given-names>Gunther</given-names>
                        </name>
                        <name name-style="western">
                            <surname>K&#xF6;hler</surname>
                            <given-names>Christian</given-names>
                        </name>
                    </person-group>
                    <article-title>How do consumers search for and appraise health information on the world wide web? Qualitative study using focus groups, usability tests, and in-depth interviews</article-title>
                    <source>BMJ</source>
                    <year>2002</year>
                    <month>3</month>
                    <day>9</day>
                    <volume>324</volume>
                    <issue>7337</issue>
                    <fpage>573</fpage>
                    <lpage>7</lpage>
                    <comment><ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://bmj.com/cgi/pmidlookup?view=long&amp;pmid=11884321" ext-link-type="uri">http://bmj.com/cgi/pmidlookup?view=long&amp;pmid=11884321</ext-link></comment>
                    <pub-id pub-id-type="medline">21881326</pub-id>
                    </nlm-citation>
            </ref>
            <ref id="ref9">
                <label>9</label>
                <nlm-citation citation-type="book">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Fox</surname>
                            <given-names>S</given-names>
                        </name>
                        <name>
                            <surname>Rainie</surname>
                            <given-names>L</given-names>
                        </name>
                    </person-group>
                    <source>Vital decisions: how Internet users decide what information to trust when they or their loved ones are sick</source>
                    <year>2002</year>
                    <publisher-loc>Washington, DC</publisher-loc>
                    <publisher-name>Pew Internet &amp; American Life Project</publisher-name>
                    <comment><ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.pewinternet.org/pdfs/PIP_Vital_Decisions_May2002.pdf" ext-link-type="uri">http://www.pewinternet.org/pdfs/PIP_Vital_Decisions_May2002.pdf</ext-link></comment>
                </nlm-citation>
            </ref>
            <ref id="ref10">
                <label>10</label>
                <nlm-citation citation-type="journal" xlink:type="simple">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Frisby</surname>
                            <given-names>Genevieve</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Bessell</surname>
                            <given-names>Tracey L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Borland</surname>
                            <given-names>Ron</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Anderson</surname>
                            <given-names>Jeremy N</given-names>
                        </name>
                    </person-group>
                    <article-title>Smoking cessation and the Internet: a qualitative method examining online consumer behavior</article-title>
                    <source>J Med Internet Res</source>
                    <year>2002</year>
                    <month>11</month>
                    <day>22</day>
                    <volume>4</volume>
                    <issue>2</issue>
                    <fpage>E8</fpage>
                    <comment><ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2002/2/e8/" ext-link-type="uri">http://www.jmir.org/2002/2/e8/</ext-link></comment>
                    <pub-id pub-id-type="medline">22442440</pub-id>
                    <pub-id pub-id-type="doi">10.2196/jmir.4.2.e8</pub-id>
                    </nlm-citation>
            </ref>
            <ref id="ref11">
                <label>11</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>O'Connor</surname>
                            <given-names>JB</given-names>
                        </name>
                        <name>
                            <surname>Johanson</surname>
                            <given-names>JF</given-names>
                        </name>
                    </person-group>
                    <article-title>Use of the Web for medical information by a gastroenterology clinic population</article-title>
                    <source>JAMA</source>
                    <year>2000</year>
                    <volume>284</volume>
                    <issue>15</issue>
                    <fpage>1962</fpage>
                    <lpage>1964</lpage>
                    <pub-id pub-id-type="doi">10.1001/jama.284.15.1962</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref12">
                <label>12</label>
                <nlm-citation citation-type="journal" xlink:type="simple">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Peterson</surname>
                            <given-names>Geraldine</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Aslani</surname>
                            <given-names>Parisa</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Williams</surname>
                            <given-names>Kylie A</given-names>
                        </name>
                    </person-group>
                    <article-title>How do consumers search for and appraise information on medicines on the Internet? A qualitative study using focus groups</article-title>
                    <source>J Med Internet Res</source>
                    <year>2003</year>
                    <month>12</month>
                    <day>19</day>
                    <volume>5</volume>
                    <issue>4</issue>
                    <fpage>e33</fpage>
                    <comment><ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2003/4/e33/" ext-link-type="uri">http://www.jmir.org/2003/4/e33/</ext-link></comment>
                    <pub-id pub-id-type="medline">14713661</pub-id>
                    <pub-id pub-id-type="doi">10.2196/jmir.5.4.e33</pub-id>
                    </nlm-citation>
            </ref>
            <ref id="ref13">
                <label>13</label>
                <nlm-citation citation-type="journal" xlink:type="simple">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Wilkas</surname>
                            <given-names>L R</given-names>
                        </name>
                    </person-group>
                    <article-title>Scientific inquiry: an introduction to search engines</article-title>
                    <source>J Soc Pediatr Nurs</source>
                    <year>2001</year>
                    <volume>6</volume>
                    <issue>3</issue>
                    <fpage>149</fpage>
                    <lpage>51</lpage>
                    <pub-id pub-id-type="medline">21420286</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref14">
                <label>14</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Lynch</surname>
                            <given-names>S</given-names>
                        </name>
                    </person-group>
                    <article-title>Google tops search sites as users flock to features</article-title>
                    <source>New York Post</source>
                    <year>2004</year>
                    <month>2</month>
                    <day>24</day>
                    <fpage>32</fpage>
                </nlm-citation>
            </ref>
            <ref id="ref15">
                <label>15</label>
                <nlm-citation citation-type="journal" xlink:type="simple">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Eysenbach</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kohler</surname>
                            <given-names>Ch</given-names>
                        </name>
                    </person-group>
                    <article-title>What is the prevalence of health-related searches on the World Wide Web? Qualitative and quantitative analysis of search engine queries on the internet</article-title>
                    <source>AMIA Annu Symp Proc</source>
                    <year>2003</year>
                    <fpage>225</fpage>
                    <lpage>9</lpage>
                    <pub-id pub-id-type="medline">14728167</pub-id>
                    <pub-id pub-id-type="pii">D030003690</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref16">
                <label>16</label>
                <nlm-citation citation-type="journal" xlink:type="simple">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Eysenbach</surname>
                            <given-names>Gunther</given-names>
                        </name>
                        <name name-style="western">
                            <surname>K&#xF6;hler</surname>
                            <given-names>Christian</given-names>
                        </name>
                    </person-group>
                    <article-title>Health-related searches on the Internet</article-title>
                    <source>JAMA</source>
                    <year>2004</year>
                    <month>6</month>
                    <day>23</day>
                    <volume>291</volume>
                    <issue>24</issue>
                    <fpage>2946</fpage>
                    <pub-id pub-id-type="medline">15213205</pub-id>
                    <pub-id pub-id-type="doi">10.1001/jama.291.24.2946</pub-id>
                    <pub-id pub-id-type="pii">291/24/2946</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref17">
                <label>17</label>
                <nlm-citation citation-type="journal" xlink:type="simple">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Spink</surname>
                            <given-names>Amanda</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Yang</surname>
                            <given-names>Yin</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Jansen</surname>
                            <given-names>Jim</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Nykanen</surname>
                            <given-names>Pirkko</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lorence</surname>
                            <given-names>Daniel P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ozmutlu</surname>
                            <given-names>Seda</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ozmutlu</surname>
                            <given-names>H Cenk</given-names>
                        </name>
                    </person-group>
                    <article-title>A study of medical and health queries to web search engines</article-title>
                    <source>Health Info Libr J</source>
                    <year>2004</year>
                    <month>3</month>
                    <volume>21</volume>
                    <issue>1</issue>
                    <fpage>44</fpage>
                    <lpage>51</lpage>
                    <pub-id pub-id-type="medline">15023208</pub-id>
                    <pub-id pub-id-type="doi">10.1111/j.1471-1842.2004.00481.x</pub-id>
                    <pub-id pub-id-type="pii">HIR481</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref18">
                <label>18</label>
                <nlm-citation citation-type="journal" xlink:type="simple">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Phillipov</surname>
                            <given-names>George</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Phillips</surname>
                            <given-names>Patrick J</given-names>
                        </name>
                    </person-group>
                    <article-title>Frequency of health-related search terms on the Internet</article-title>
                    <source>JAMA</source>
                    <year>2003</year>
                    <month>11</month>
                    <day>5</day>
                    <volume>290</volume>
                    <issue>17</issue>
                    <fpage>2258</fpage>
                    <lpage>9</lpage>
                    <pub-id pub-id-type="doi">10.1001/jama.290.17.2258</pub-id>
                    <pub-id pub-id-type="pii">290/17/2258</pub-id>
                    <pub-id pub-id-type="medline">22962627</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref19">
                <label>19</label>
                <nlm-citation citation-type="book">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Madden</surname>
                            <given-names>M</given-names>
                        </name>
                    </person-group>
                    <source>America's online pursuits: the changing picture of who's online and what they do</source>
                    <year>2003</year>
                    <publisher-loc>Washington, DC</publisher-loc>
                    <publisher-name>Pew Internet &amp; American Life Project</publisher-name>
                    <comment><ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.pewinternet.org/pdfs/PIP_Online_Pursuits_Final.PDF" ext-link-type="uri">http://www.pewinternet.org/pdfs/PIP_Online_Pursuits_Final.PDF</ext-link></comment>
                </nlm-citation>
            </ref>
            <ref id="ref20">
                <label>20</label>
                <nlm-citation citation-type="book">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Fox</surname>
                            <given-names>S</given-names>
                        </name>
                    </person-group>
                    <source>Health information online: eight in ten Internet users have looked for health information online, with increased interest in diet, fitness, drugs, health insurance, experimental treatments, and particular doctors and hospitals</source>
                    <year>2005</year>
                    <publisher-loc>Washington, DC</publisher-loc>
                    <publisher-name>Pew Internet &amp; American Life Project</publisher-name>
                    <comment><ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.pewinternet.org/pdfs/PIP_Healthtopics_May05.pdf" ext-link-type="uri">http://www.pewinternet.org/pdfs/PIP_Healthtopics_May05.pdf</ext-link></comment>
                </nlm-citation>
            </ref>
            <ref id="ref21">
                <label>21</label>
                <nlm-citation citation-type="journal" xlink:type="simple">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Bader</surname>
                            <given-names>Judith L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Theofanos</surname>
                            <given-names>Mary Frances</given-names>
                        </name>
                    </person-group>
                    <article-title>Searching for cancer information on the Internet: analyzing natural language search queries</article-title>
                    <source>J Med Internet Res</source>
                    <year>2003</year>
                    <month>12</month>
                    <day>11</day>
                    <volume>5</volume>
                    <issue>4</issue>
                    <fpage>e31</fpage>
                    <comment><ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2003/4/e31/" ext-link-type="uri">http://www.jmir.org/2003/4/e31/</ext-link></comment>
                    <pub-id pub-id-type="medline">14713659</pub-id>
                    <pub-id pub-id-type="doi">10.2196/jmir.5.4.e31</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref22">
                <label>22</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Elgin</surname>
                            <given-names>B</given-names>
                        </name>
                    </person-group>
                    <article-title>The search war is about to get bloody</article-title>
                    <source>Business Week</source>
                    <year>2003</year>
                    <month>7</month>
                    <day>28</day>
                    <volume>3843</volume>
                    <fpage>72</fpage>
                </nlm-citation>
            </ref>
            <ref id="ref23">
                <label>23</label>
                <nlm-citation citation-type="web">
                    <collab collab-type="authors">Yahoo! Buzz Index</collab>
                    <source>Home page</source>
                    <access-date>2005 Jun 27</access-date>
                    <comment><ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://buzz.yahoo.com/client/" ext-link-type="uri">https://buzz.yahoo.com/client/</ext-link></comment>
                </nlm-citation>
            </ref>
            <ref id="ref24">
                <label>24</label>
                <nlm-citation citation-type="book">
                    <collab collab-type="authors">American Cancer Society</collab>
                    <source>Cancer Facts &amp; Figures 2001</source>
                    <year>2001</year>
                    <publisher-loc>Atlanta, GA</publisher-loc>
                    <publisher-name>American Cancer Society Inc</publisher-name>
                </nlm-citation>
            </ref>
            <ref id="ref25">
                <label>25</label>
                <nlm-citation citation-type="book">
                    <collab collab-type="authors">American Cancer Society</collab>
                    <source>Cancer Facts &amp; Figures 2002</source>
                    <year>2002</year>
                    <publisher-loc>Atlanta, GA</publisher-loc>
                    <publisher-name>American Cancer Society Inc</publisher-name>
                </nlm-citation>
            </ref>
            <ref id="ref26">
                <label>26</label>
                <nlm-citation citation-type="book">
                    <collab collab-type="authors">American Cancer Society</collab>
                    <source>Cancer Facts &amp; Figures 2003</source>
                    <year>2003</year>
                    <publisher-loc>Atlanta, GA</publisher-loc>
                    <publisher-name>American Cancer Society Inc</publisher-name>
                </nlm-citation>
            </ref>
            <ref id="ref27">
                <label>27</label>
                <nlm-citation citation-type="journal" xlink:type="simple">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Giles</surname>
                            <given-names>G G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Severi</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>English</surname>
                            <given-names>D R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>McCredie</surname>
                            <given-names>M R E</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Borland</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Boyle</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hopper</surname>
                            <given-names>J L</given-names>
                        </name>
                    </person-group>
                    <article-title>Sexual factors and prostate cancer</article-title>
                    <source>BJU Int</source>
                    <year>2003</year>
                    <month>8</month>
                    <volume>92</volume>
                    <issue>3</issue>
                    <fpage>211</fpage>
                    <lpage>6</lpage>
                    <pub-id pub-id-type="pii">4319</pub-id>
                    <pub-id pub-id-type="medline">22769687</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref28">
                <label>28</label>
                <nlm-citation citation-type="journal" xlink:type="simple">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Irani</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lefebvre</surname>
                            <given-names>O</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Murat</surname>
                            <given-names>F</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Dahmani</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Dor&#xE9;</surname>
                            <given-names>B</given-names>
                        </name>
                    </person-group>
                    <article-title>Obesity in relation to prostate cancer risk: comparison with a population having benign prostatic hyperplasia</article-title>
                    <source>BJU Int</source>
                    <year>2003</year>
                    <month>4</month>
                    <volume>91</volume>
                    <issue>6</issue>
                    <fpage>482</fpage>
                    <lpage>4</lpage>
                    <pub-id pub-id-type="pii">4133</pub-id>
                    <pub-id pub-id-type="medline">22543703</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref29">
                <label>29</label>
                <nlm-citation citation-type="journal" xlink:type="simple">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Adelman</surname>
                            <given-names>R C</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Verbrugge</surname>
                            <given-names>L M</given-names>
                        </name>
                    </person-group>
                    <article-title>Death makes news: the social impact of disease on newspaper coverage</article-title>
                    <source>J Health Soc Behav</source>
                    <year>2000</year>
                    <month>9</month>
                    <volume>41</volume>
                    <issue>3</issue>
                    <fpage>347</fpage>
                    <lpage>67</lpage>
                    <pub-id pub-id-type="medline">20465891</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref30">
                <label>30</label>
                <nlm-citation citation-type="journal" xlink:type="simple">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Van Der Wardt</surname>
                            <given-names>E M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Taal</surname>
                            <given-names>E</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Rasker</surname>
                            <given-names>J J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Wiegman</surname>
                            <given-names>O</given-names>
                        </name>
                    </person-group>
                    <article-title>Media coverage of chronic diseases in the Netherlands</article-title>
                    <source>Semin Arthritis Rheum</source>
                    <year>1999</year>
                    <month>4</month>
                    <volume>28</volume>
                    <issue>5</issue>
                    <fpage>333</fpage>
                    <lpage>41</lpage>
                    <pub-id pub-id-type="medline">99271819</pub-id>
                    <pub-id pub-id-type="doi">10.1016/S0049-0172(99)80018-3</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref31">
                <label>31</label>
                <nlm-citation citation-type="journal" xlink:type="simple">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Frost</surname>
                            <given-names>K</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Frank</surname>
                            <given-names>E</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Maibach</surname>
                            <given-names>E</given-names>
                        </name>
                    </person-group>
                    <article-title>Relative risk in the news media: a quantification of misrepresentation</article-title>
                    <source>Am J Public Health</source>
                    <year>1997</year>
                    <month>5</month>
                    <volume>87</volume>
                    <issue>5</issue>
                    <fpage>842</fpage>
                    <lpage>5</lpage>
                    <pub-id pub-id-type="medline">97327959</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref32">
                <label>32</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Kristiansen</surname>
                            <given-names>CM</given-names>
                        </name>
                    </person-group>
                    <article-title>Newspaper coverage of diseases and actual mortality statistics</article-title>
                    <source>Eur J Soc Psychol</source>
                    <year>1983</year>
                    <volume>13</volume>
                    <fpage>193</fpage>
                    <lpage>194</lpage>
                </nlm-citation>
            </ref>
            <ref id="ref33">
                <label>33</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Combs</surname>
                            <given-names>B</given-names>
                        </name>
                        <name>
                            <surname>Slovic</surname>
                            <given-names>P</given-names>
                        </name>
                    </person-group>
                    <article-title>Newspaper coverage of causes of death</article-title>
                    <source>Journalism Quart</source>
                    <year>1979</year>
                    <fpage>837</fpage>
                    <lpage>843</lpage>
                    <fpage>849</fpage>
                </nlm-citation>
            </ref>
            <ref id="ref34">
                <label>34</label>
                <nlm-citation citation-type="journal" xlink:type="simple">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Eysenbach</surname>
                            <given-names>Gunther</given-names>
                        </name>
                    </person-group>
                    <article-title>SARS and population health technology</article-title>
                    <source>J Med Internet Res</source>
                    <year>2003</year>
                    <month>6</month>
                    <day>30</day>
                    <volume>5</volume>
                    <issue>2</issue>
                    <fpage>e14</fpage>
                    <comment><ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2003/2/e14/" ext-link-type="uri">http://www.jmir.org/2003/2/e14/</ext-link></comment>
                    <pub-id pub-id-type="medline">22741895</pub-id>
                    <pub-id pub-id-type="doi">10.2196/jmir.5.2.e14</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref35">
                <label>35</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name>
                            <surname>Eysenbach</surname>
                            <given-names>G</given-names>
                        </name>
                    </person-group>
                    <article-title>Infodemiology: toward methods and measures for understanding and quantifying the distribution, determinants, and impact of information</article-title>
                    <source>Proc AMIA Annu Fall Symp</source>
                    <year>2005</year>
                    <comment>[submitted]</comment>
                </nlm-citation>
            </ref>
        </ref-list>
    </back>
</article>
