<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
    <front>
        <journal-meta>
            <journal-id journal-id-type="publisher-id">JMIR</journal-id>
            <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
            <journal-title>Journal of Medical Internet Research</journal-title>
            <issn pub-type="epub">14388871</issn>
            <publisher>
                <publisher-name>JMIR Publications Inc.</publisher-name>
                <publisher-loc>Toronto, Canada</publisher-loc>
            </publisher>
        </journal-meta>
        <article-meta>
            <article-id pub-id-type="publisher-id">v15i9e192</article-id>
            <article-id pub-id-type="pmid">23999327</article-id>
            <article-id pub-id-type="doi">10.2196/jmir.2180</article-id>
            <article-categories>
                <subj-group subj-group-type="article-type">
                    <subject>Original Paper</subject>
                </subj-group>
            </article-categories>
            <title-group>
                <article-title>Infodemiology of Alcohol Use in Hong Kong Mentioned on Blogs: Infoveillance Study</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="editor">
                    <name>
                        <surname>Eysenbach</surname>
                        <given-names>Gunther</given-names>
                    </name>
                </contrib>
            </contrib-group>
            <contrib-group>
                <contrib contrib-type="reviewer">
                    <name>
                        <surname>Leal Neto</surname>
                        <given-names>Onicio</given-names>
                    </name>
                </contrib>
                <contrib contrib-type="reviewer">
                    <name>
                        <surname>Durant</surname>
                        <given-names>Kathleen</given-names>
                    </name>
                </contrib>
                <contrib contrib-type="reviewer">
                    <name>
                        <surname>Jiang</surname>
                        <given-names>Yunliang</given-names>
                    </name>
                </contrib>
                <contrib contrib-type="reviewer">
                    <name>
                        <surname>Li</surname>
                        <given-names>Jingquan</given-names>
                    </name>
                </contrib>
                <contrib contrib-type="reviewer">
                    <name>
                        <surname>Perez-Rey</surname>
                        <given-names>David</given-names>
                    </name>
                </contrib>
                <contrib contrib-type="reviewer">
                    <name>
                        <surname>West</surname>
                        <given-names>Joshua</given-names>
                    </name>
                </contrib>
            </contrib-group>
            <contrib-group>
                <contrib contrib-type="author" id="contrib1" equal-contrib="yes">
                    <name name-style="western">
                        <surname>Chan</surname>
                        <given-names>KL</given-names>
                    </name>
                    <degrees>MBBS</degrees>
                    <xref ref-type="aff" rid="aff1">1</xref>
                </contrib>
                <contrib contrib-type="author" id="contrib2" corresp="yes" equal-contrib="yes">
                    <name name-style="western">
                        <surname>Ho</surname>
                        <given-names>SY</given-names>
                    </name>
                    <degrees>PhD</degrees>
                    <xref ref-type="aff" rid="aff1">1</xref>
                    <address>
                        <institution>School of Public Health, The University of Hong Kong</institution>
                        <addr-line>21 Sassoon Road, Pokfulam</addr-line>
                        <addr-line>Hong Kong</addr-line>
                        <country>China (Hong Kong)</country>
                        <phone>852 28199883</phone>
                        <fax>852 28559528</fax>
                        <email>syho@hku.hk</email>
                    </address>
                </contrib>
                <contrib contrib-type="author" id="contrib3" equal-contrib="yes">
                    <name name-style="western">
                        <surname>Lam</surname>
                        <given-names>TH</given-names>
                    </name>
                    <degrees>MD</degrees>
                    <xref ref-type="aff" rid="aff1">1</xref>
                </contrib>
            </contrib-group>
            <aff id="aff1" rid="aff1">
                <sup>1</sup>
                <institution>School of Public Health, The University of Hong Kong</institution>
                <addr-line>Hong Kong</addr-line>
                <country>China (Hong Kong)</country>
            </aff>
            <author-notes>
                <corresp>Corresponding Author: SY Ho <email>syho@hku.hk</email>
                </corresp>
            </author-notes>
            <pub-date pub-type="collection">
                <month>09</month>
                <year>2013</year>
            </pub-date>
            <pub-date pub-type="epub">
                <day>02</day>
                <month>09</month>
                <year>2013</year>
            </pub-date>
            <volume>15</volume>
            <issue>9</issue>
            <elocation-id>e192</elocation-id>
            <!--history from ojs - api-xml-->
            <history>
                <date date-type="received">
                    <day>23</day>
                    <month>05</month>
                    <year>2012</year>
                </date>
                <date date-type="rev-request">
                    <day>29</day>
                    <month>07</month>
                    <year>2012</year>
                </date>
                <date date-type="rev-recd">
                    <day>29</day>
                    <month>08</month>
                    <year>2012</year>
                </date>
                <date date-type="accepted">
                    <day>25</day>
                    <month>06</month>
                    <year>2013</year>
                </date>
            </history>
            <!--(c) the authors - correct author names and publication date here if necessary. Date in form ', dd.mm.yyyy' after jmir.org-->
            <copyright-statement>&#169;KL Chan, SY Ho, TH Lam. Originally published in the Journal of Medical Internet Research (http://www.jmir.org), 02.09.2013. </copyright-statement>
            <copyright-year>2013</copyright-year>
            <license license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/2.0/">
                <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (http://creativecommons.org/licenses/by/2.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on http://www.jmir.org/, as well as this copyright and license information must be included.</p>
            </license>
            <self-uri xlink:href="http://www.jmir.org/2013/9/e192/" xlink:type="simple" />
            <abstract>
                <sec sec-type="Background">
                    <title>Background</title>
                    <p>In 2007 and 2008, the beer and wine tax in Hong Kong was halved and then abolished, resulting in an increase of alcohol consumption. The prevalence of the Internet and a high blogging rate by adolescents and adults present a unique opportunity to study drinking patterns by infodemiology.</p>
                </sec>
                <sec sec-type="Objective">
                    <title>Objective</title>
                    <p>To assess and explain the online use of alcohol-related Chinese keywords and to validate blog searching as an infoveillance method for surveying changes in drinking patterns (eg, alcohol type) in Hong Kong people (represented by bloggers on a Hong Kong&#8211;based Chinese blogging site) in 2005-2010.</p>
                </sec>
                <sec sec-type="Methods">
                    <title>Methods</title>
                    <p>Blog searching was done using a blog search engine, Google Blog Search, in the archives of a Hong Kong&#8211;based blog service provider, MySinaBlog from 2005-2010. Three groups of Chinese keywords, each representing a specific alcohol-related concept, were used: (1) &#8220;alcohol&#8221; (ie, the control concept), (2) &#8220;beer or wine&#8221;, and (3) &#8220;spirit&#8221;. The resulting blog posts were analyzed quantitatively using infodemiological metrics and correlation coefficients, and qualitatively by manual effort. The infodemiological metrics were (1) apparent prevalence, (2) actual prevalence, (3) prevalence rate, and (4) prevalence ratio. Pearson and Spearman correlations were calculated for prevalence rates and ratios with respect to per capita alcohol consumption. Manual analysis focused on (1) blog author characteristics (ie, authorship, sex, and age), and (2) blog content (ie, frequency of keywords, description of a discrete episode of alcohol drinking, drinking amount, and genres).</p>
                </sec>
                <sec sec-type="Results">
                    <title>Results</title>
                    <p>The online use of alcohol-related concepts increased noticeably for &#8220;alcohol&#8221; in 2008 and &#8220;spirit&#8221; in 2008-2009 but declined for &#8220;beer or wine&#8221; over the years. Correlation between infodemiological and epidemiological data was only significant for the &#8220;alcohol&#8221; prevalence rate. Most blogs were managed by single authors. Their sex distribution was even, and the majority were aged 18 and above. Not all Chinese keywords were found. Many of the blog posts did not describe a discrete episode of alcohol drinking and were classified as personal diary, opinion, or emotional outlets. The rest lacked information on drinking amount, which hindered assessment of binge drinking.</p>
                </sec>
                <sec sec-type="Conclusions">
                    <title>Conclusions</title>
                    <p>The prevalence of alcohol-related Chinese keywords online was attributed to many different factors, including spam, and hence not a specific reflection of local drinking patterns. Correlation between infodemiological data (represented by prevalence rates and ratios of alcohol-related concepts) and epidemiological data (represented by per capita alcohol consumption) was poor. Many blog posts were affective rather than informative in nature. Semantic analysis of blog content was recommended given enough expertise and resources.</p>
                </sec>
            </abstract>
            <kwd-group>
                <kwd>alcohol drinking</kwd>
                <kwd>blogging</kwd>
                <kwd>blog search</kwd>
                <kwd>Chinese</kwd>
                <kwd>Hong Kong</kwd>
                <kwd>infodemiology</kwd>
                <kwd>infoveillance</kwd>
                <kwd>Internet</kwd>
            </kwd-group>
        </article-meta>
    </front>
    <body>
        <sec sec-type="introduction">
            <title>Introduction</title>
            <sec>
                <title>Alcohol Use and Tax Policies in Hong Kong</title>
                <p>Although often overlooked, alcohol is a human carcinogen [<xref ref-type="bibr" rid="ref1">1</xref>]. It causes 2.5 million deaths each year worldwide [<xref ref-type="bibr" rid="ref2">2</xref>], and the United Nations has identified its harmful use as one of the four most important risk factors for noncommunicable diseases [<xref ref-type="bibr" rid="ref3">3</xref>]. In Hong Kong, although alcohol consumption is still low, it is not uncommon. Alcohol is easily accessible by the general population due to a lack of regulation of minimum age for off-premises sales (with &#8220;premises&#8221; defined as restaurants and bars granted with a liquor license) [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref5">5</xref>]. Local studies have shown that almost one-third of adults and one-fourth of secondary school students drink alcohol [<xref ref-type="bibr" rid="ref6">6</xref>]. The adverse health effects are daunting. According to the data released by the Department of Health in 2006-10, there was an annual average of more than 2000 episodes of in-patient discharges and deaths due to an alcohol-related disease [<xref ref-type="bibr" rid="ref6">6</xref>].</p>
                <p>Nonetheless, the Hong Kong Special Administrative Region (HKSAR) Government halved the duty on beer and wine with an alcoholic strength of not more than 30% in 2007 [<xref ref-type="bibr" rid="ref7">7</xref>], and abolished it altogether in 2008 [<xref ref-type="bibr" rid="ref8">8</xref>]. The duty rate on spirits with an alcoholic strength of more than 30% remained at 100% [<xref ref-type="bibr" rid="ref8">8</xref>]. These unprecedented and anti-public health policies were aimed to help Hong Kong develop into an international wine trading hub, at the cost of increased alcohol-related harms to public health [<xref ref-type="bibr" rid="ref9">9</xref>]. The Working Group on Alcohol and Health of the Department of Health noticed a surge in the alcohol consumption per capita in Hong Kong in 2008, which was attributed to the lowered price of beer and wine in the same year [<xref ref-type="bibr" rid="ref4">4</xref>]. This echoed a meta-analysis of 112 studies, which found an inverse relation of alcohol tax or price with consumption [<xref ref-type="bibr" rid="ref10">10</xref>]. In Finland, the one-third reduction of excise duties on alcoholic beverages in 2004 resulted in a clear rise in alcohol consumption and related harms [<xref ref-type="bibr" rid="ref11">11</xref>], including hospitalization rate [<xref ref-type="bibr" rid="ref12">12</xref>] and number of sudden deaths [<xref ref-type="bibr" rid="ref13">13</xref>]. The drastic change of beer and wine tax policy in Hong Kong presents a unique opportunity to study alcohol drinking using infodemiology.</p>
            </sec>
            <sec>
                <title>Infodemiology and Infoveillance</title>
                <p>Infodemiology is a portmanteau of information and epidemiology, which is, according to Eysenbach, &#8220;the science of distribution and determinants of information in an electronic medium, specifically the Internet, or in a population, with the ultimate aim to inform public health and public policy&#8221; [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref15">15</xref>]. It is based on a bidirectional relation between population health status/attitudes/behavior and information patterns on the Internet [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>]. Originally used to identify inaccurate health information on the Internet [<xref ref-type="bibr" rid="ref17">17</xref>], it was later found that search engine query data could predict influenza epidemics [<xref ref-type="bibr" rid="ref18">18</xref>]. Given its implication in public health and policy, infodemiology has since been used as a complement to traditional epidemiological studies [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>], using analytical methods and metrics such as keyword prevalence and prevalence ratio [<xref ref-type="bibr" rid="ref14">14</xref>]. The longitudinal tracking of infodemiology metrics for surveillance and trend analysis is called infoveillance [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref15">15</xref>].</p>
                <p>Over the past decade, efforts have been made to overcome the difficulties in aggregating and analyzing the vast, unstructured information from the online database [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>]. Examples of infodemiology within the public health sector include detection of disease outbreak or incidence by tracking search queries [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref18">18</xref>-<xref ref-type="bibr" rid="ref20">20</xref>], investigating online search behavior for suicide-related information [<xref ref-type="bibr" rid="ref21">21</xref>], monitoring public reactions towards health-related policy and campaigns [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref23">23</xref>], and identifying public health concerns from user posts in social networking sites such as Twitter [<xref ref-type="bibr" rid="ref24">24</xref>]. Several computer tools have also been developed that allow more effective infodemiological analysis (eg, Technosocial Predictive Analytics [<xref ref-type="bibr" rid="ref25">25</xref>], Infovigil [<xref ref-type="bibr" rid="ref15">15</xref>], Global Public Health Intelligence Network, and HealthMap [<xref ref-type="bibr" rid="ref26">26</xref>]). All these are underpinned by the technology of Web 2.0, which features individuation, open property, sociality, and microcontent [<xref ref-type="bibr" rid="ref27">27</xref>]. One established example of Web 2.0 is online social networking.</p>
            </sec>
            <sec>
                <title>Online Social Networking, Blogs, and Blog Searching</title>
                <p>Online social networking is constantly evolving. With proper mining and analytic technique [<xref ref-type="bibr" rid="ref28">28</xref>], it might be possible to extract useful information from these networking sites for research purpose. Blogs (also called weblogs) are a kind of social networking website that is regarded as a relatively new form of mainstream personal communication [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref30">30</xref>]. They are characterized as being personalized, Web-based, community-supported, and automated [<xref ref-type="bibr" rid="ref31">31</xref>]. Blog contents are versatile. They could be about the blogger&#8217;s life, commentaries, ideas, and emotions. They are also used to form and maintain community forums [<xref ref-type="bibr" rid="ref32">32</xref>]. While some blogs are employed for political, educational, and commercial purposes [<xref ref-type="bibr" rid="ref33">33</xref>], most are likened to diaries and are referred to as personal blogs [<xref ref-type="bibr" rid="ref34">34</xref>]. People using blog services are referred to as bloggers.</p>
                <p>Like other social networking sites, blogs are featured by their time stamps, consumer-generated content, and expansile database, making them potentially useful for longitudinal data retrieval and analysis [<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref36">36</xref>]. In fact, blog analysis has become increasingly popular in various domains. Examples of its application include assessing a company&#8217;s image strength or customer product, monitoring public opinion in presidential elections, evaluating public reaction to disasters, tracing online hate groups or people with suicidal intent, studying youth cultures, and analyzing linguistic patterns [<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref37">37</xref>-<xref ref-type="bibr" rid="ref40">40</xref>]. The prerequisite of blog analysis for public surveillance is that a large proportion of the population should use the social Web services regularly, so that online information can be kept up-to-date and truly reflect the contemporary interest or concern of the community [<xref ref-type="bibr" rid="ref25">25</xref>].</p>
            </sec>
            <sec>
                <title>Internet Use and Blogging in Hong Kong: Applying Blog Searches in Local Public Health Research</title>
                <p>Internet use is ubiquitous in Hong Kong. In a survey by the HKSAR Government, Internet penetration of local population continued to rise over the years, from 56.9% in 2005 to 72.8% in 2012. Almost 70% of the online population were adolescents and adults aged 10-44 [<xref ref-type="bibr" rid="ref41">41</xref>]. They also constituted the largest population engaging in online social networking activities including blogs and forums [<xref ref-type="bibr" rid="ref42">42</xref>]. This was consistent with an older study by Blog-You.com and IN-Media in 2005, which found over 90% of local bloggers were aged 16-35 [<xref ref-type="bibr" rid="ref43">43</xref>]. Infodemiology using blog searching data is therefore useful for studying important health issues among Hong Kong adolescents and adults, such as alcohol use.</p>
                <p>There are different methods of blog analysis. Some (eg, time series scanning, semantic analysis) require special software and significant investment of time and computing resources [<xref ref-type="bibr" rid="ref35">35</xref>]. This has greatly reduced its practicability in public health research done by clinicians who might not otherwise know much about computer programming. On the other hand, blog searching using blog search engines, which are freely available online, provides a technically easy, straightforward, and user-friendly method to extract data from blogs. Unlike Web search engines, blog search engines mainly index blog posts and are dedicated to searching information from blog posts only, ignoring the rest of the database [<xref ref-type="bibr" rid="ref44">44</xref>]. Since each blog post is time-stamped, a blog search engine could search for date-specific blog posts, allowing longitudinal blog tracking, even retrospectively.</p>
                <p>Local public health research using blog search and Chinese keywords is rarely done at the moment. Should blog searching data be correlated with local epidemiological data, clinicians (and policy makers) could readily replace traditional surveillance methods with blog searching&#8212;which is real-time, cheap, and fast&#8212;for public health tracking. Even if there is no correlation, an explanatory study like this would still contribute to the development of health informatics by demonstrating the challenges of Chinese blog searches in an otherwise English-dominated research environment. The clear rise of alcohol consumption in Hong Kong due to zero beer and wine tax provides a sound framework under which blog searching data can be validated against local epidemiology.</p>
            </sec>
            <sec>
                <title>Study Objectives and Hypotheses</title>
                <p>Using currently available search tools and Web resources, this study aimed to: (1) assess and explain the online use of alcohol-related Chinese keywords, and (2) validate blog searching as an infoveillance method to survey changes in the drinking patterns (eg, alcohol type) of Hong Kong people (represented by bloggers in a Hong Kong&#8211;based Chinese blog service provider) following changes to the beer and wine tax in 2007-8.</p>
                <p>Following are the hypotheses of this study:</p>
                <p>(H1) The online popularity of alcohol-related concepts, in particular &#8220;beer or wine&#8221;, increased among Chinese bloggers after 2007-8 when local tax policy on beer or wine changed.</p>
                <p>(H2) Infodemiological data (represented by prevalence rate and ratio of alcohol-related concepts) correlated significantly with local epidemiological data (represented by per capita alcohol consumption).</p>
            </sec>
        </sec>
        <sec sec-type="methods">
            <title>Methods</title>
            <sec>
                <title>Study Design</title>
                <p>To the best of our knowledge, this was the first research done in Hong Kong using blog searches to study a public health&#8211;related topic. The issue of alcohol drinking was chosen because of its public health interest and clear impacts by tax policy changes. Blogs were targeted for data extraction because regional interest could be maximized by choosing a blog service provider with the highest local rank and visitors, unlike other social networking sites such as Twitter or Facebook, which tend to cover a wide geographical area.</p>
                <p>There were two main sets of data in this study: (1) infodemiology and (2) epidemiology. Infodemiological data stemmed from existing blogs indexed by a specific search engine, whereas epidemiological data were obtained from government documents covering the issues of public health. To reduce expertise and technology investment, this study used a free Web-based blog search engine, Google Blog Search, to extract data from the archives of a Hong Kong&#8211;based blog service provider, MySinaBlog, from 2005-2010. Three groups of Chinese keywords were used, each representing a specific alcohol-related concept. They were (1) &#8220;alcohol&#8221; (ie, the control concept), (2) &#8220;beer or wine&#8221;, and (3) &#8220;spirit&#8221;. The resulting blog posts were analyzed quantitatively using infodemiological metrics and correlation coefficients, and qualitatively by manual effort. The infodemiological metrics were (1) apparent prevalence, (2) actual prevalence, (3) prevalence rate, and (4) prevalence ratio. Pearson and Spearman correlations were calculated for prevalence rates and ratios with respect to per capita alcohol consumption in the same years. Manual analysis included (1) blog author characteristics (ie, authorship, sex, and age), and (2) blog content (ie, frequency of keywords, description of a discrete episode of alcohol drinking, drinking amount, and genres). The prevalence rate and ratio were used to assess the online popularity of alcohol-related concepts, whereas the correlation analysis and manual analysis were used to validate blog searching data as an infoveillance method for population survey.</p>
            </sec>
            <sec>
                <title>Collection of Infodemiological Data</title>
                <sec>
                    <title>Blog Service Provider</title>
                    <p>The online database of the blog service provider enabled search tasks and collection of infodemiological data. Inclusion criteria were (1) free of charge, (2) currently under service, and (3) last updated in or after 2010. As such, 19 blogging sites were enlisted from 852.com [<xref ref-type="bibr" rid="ref45">45</xref>], which was a Hong Kong-based Web directory, and TopTenREVIEWS [<xref ref-type="bibr" rid="ref46">46</xref>], a media review website. Their online traffic data were obtained from two Web information companies, Alexa Internet [<xref ref-type="bibr" rid="ref47">47</xref>] and StatsCrop [<xref ref-type="bibr" rid="ref48">48</xref>], shown in <xref ref-type="table" rid="table1">Table 1</xref>. They were excluded if (1) the only available figures were from their non-blog domain server, or (2) data were not available. The rest were compared in terms of their local popularity (measured by Alexa traffic rank in Hong Kong and percentage of daily visitors from Hong Kong) and primary country/server location to maximize the regional interest. MySinaBlog, a Hong Kong-based blog service provider with a local rank of 201 and more than half of its visitors from Hong Kong, was eventually selected.</p>
                    <table-wrap position="float" id="table1">
                        <label>Table 1</label>
                        <caption>
                            <p>Alexa traffic rank in Hong Kong, percentage of daily visitors from Hong Kong, and primary country<sup>a</sup> of selected free blogging sites (as on April 12, 2013).</p>
                        </caption>
                        <table width="617" border="1" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                            <col width="180" />
                            <col width="101" />
                            <col width="139" />
                            <col width="138" />
                            <thead>
                                <tr valign="top">
                                    <td>URL</td>
                                    <td>Alexa traffic rank in Hong Kong</td>
                                    <td>Percentage of daily visitors from Hong Kong</td>
                                    <td>Primary country</td>
                                </tr>
                            </thead>
                            <tbody>
                                <tr valign="top">
                                    <td>blogcity.me</td>
                                    <td>1145</td>
                                    <td>74.2</td>
                                    <td>Hong Kong</td>
                                </tr>
                                <tr valign="bottom">
                                    <td>blog.mingpao.com</td>
                                    <td>94<sup>b</sup>
                                    </td>
                                    <td>56.8<sup>b</sup>
                                    </td>
                                    <td>Hong Kong</td>
                                </tr>
                                <tr valign="bottom">
                                    <td>blog.yahoo.com/explorer/hk</td>
                                    <td>4<sup>b</sup>
                                    </td>
                                    <td>0.8<sup>b</sup>
                                    </td>
                                    <td>United States</td>
                                </tr>
                                <tr valign="top">
                                    <td>hk.xanga.com</td>
                                    <td>571</td>
                                    <td>5.4</td>
                                    <td>United States</td>
                                </tr>
                                <tr valign="top">
                                    <td>lifestream.aol.com</td>
                                    <td>Data not available</td>
                                    <td>Data not available</td>
                                    <td>United States</td>
                                </tr>
                                <tr valign="top">
                                    <td>mysinablog.com</td>
                                    <td>201</td>
                                    <td>50.8</td>
                                    <td>Hong Kong</td>
                                </tr>
                                <tr valign="top">
                                    <td>qooza.hk</td>
                                    <td>417</td>
                                    <td>35.7</td>
                                    <td>Hong Kong</td>
                                </tr>
                                <tr valign="top">
                                    <td>showhappy.net</td>
                                    <td>Data not available</td>
                                    <td>Data not available</td>
                                    <td>United States</td>
                                </tr>
                                <tr valign="top">
                                    <td>spaces.live.com</td>
                                    <td>Data not available</td>
                                    <td>Data not available</td>
                                    <td>Iran</td>
                                </tr>
                                <tr valign="bottom">
                                    <td>space.gogo.la</td>
                                    <td>1352<sup>b</sup>
                                    </td>
                                    <td>67.0<sup>b</sup>
                                    </td>
                                    <td>Hong Kong</td>
                                </tr>
                                <tr valign="bottom">
                                    <td>space.uwants.com/html/blog.html</td>
                                    <td>22<sup>b</sup>
                                    </td>
                                    <td>57.4<sup>b</sup>
                                    </td>
                                    <td>Hong Kong</td>
                                </tr>
                                <tr valign="top">
                                    <td>wordpress.com</td>
                                    <td>Data not available</td>
                                    <td>Data not available</td>
                                    <td>United States</td>
                                </tr>
                                <tr valign="top">
                                    <td>www.blogger.com</td>
                                    <td>Data not available</td>
                                    <td>Data not available</td>
                                    <td>India</td>
                                </tr>
                                <tr valign="top">
                                    <td>www.ezhk.net</td>
                                    <td>Data not available</td>
                                    <td>Data not available</td>
                                    <td>Hong Kong</td>
                                </tr>
                                <tr valign="bottom">
                                    <td>www.hkflash.com/diary</td>
                                    <td>7012<sup>b</sup>
                                    </td>
                                    <td>25.6<sup>b</sup>
                                    </td>
                                    <td>South Korea</td>
                                </tr>
                                <tr valign="top">
                                    <td>www.livejournal.com</td>
                                    <td>Data not available</td>
                                    <td>Data not available</td>
                                    <td>Russia</td>
                                </tr>
                                <tr valign="top">
                                    <td>www.mocasting.com</td>
                                    <td>16,435</td>
                                    <td>51.8</td>
                                    <td>China</td>
                                </tr>
                                <tr valign="top">
                                    <td>www.myspace.com</td>
                                    <td>Data not available</td>
                                    <td>Data not available</td>
                                    <td>United States</td>
                                </tr>
                                <tr valign="top">
                                    <td>www6.mobichai.com/blog</td>
                                    <td>Data not available</td>
                                    <td>Data not available</td>
                                    <td>Hong Kong</td>
                                </tr>
                            </tbody>
                        </table>
                        <table-wrap-foot>
                            <fn id="table1fn1">
                                <p>
                                    <sup>a</sup>Or server location if the primary country was not known.</p>
                            </fn>
                            <fn id="table1fn2">
                                <p>
                                    <sup>b</sup>Representing the only available data from its non-blog domain server.</p>
                            </fn>
                        </table-wrap-foot>
                    </table-wrap>
                </sec>
                <sec>
                    <title>Blog Search Engine and Search Query</title>
                    <p>The capabilities and limitations of 11 blog search engines were compared in one study by Thelwall [<xref ref-type="bibr" rid="ref44">44</xref>]. Among them, Google Blog Search was the only one equipped with all of the following features: (1) full Boolean search, (2) user-specified date or date range search, (3) URL search, (4) language selection, and (5) word location. It was therefore employed in the present study.</p>
                    <p>In each search query, the following were included: (1) alcohol-related Chinese keywords connected by the Boolean operator &#8220;OR&#8221;, and (2) URL of the blog service provider expressed as &#8220;site:mysinablog.com&#8221;. To obtain the total number of blog posts, the keywords were substituted by a space. The date was specified as January 1 to December 31 of each year from 2005-2010. The timeframe was so decided because MySinaBlog started to run their service in 2005 [<xref ref-type="bibr" rid="ref49">49</xref>], and epidemiological data regarding alcohol consumption per capita in Hong Kong was only up to 2010 [<xref ref-type="bibr" rid="ref4">4</xref>]. The search results (ie, number of matched blog posts) were taken for infodemiology analysis.</p>
                </sec>
                <sec>
                    <title>Alcohol-Related Concepts and Keywords</title>
                    <sec>
                        <title>Overview</title>
                        <p>Specific groups of alcohol-related keywords formed the basis of blog searching in this study. Each group corresponded to a concept and comprised multiple keywords connected by the Boolean operator &#8220;OR&#8221; (which would return blog posts containing any of the search terms) to explore the same concept, as suggested by Eysenbach in his framework on infodemiology and infoveillance [<xref ref-type="bibr" rid="ref14">14</xref>]. The concepts were (1) &#8220;alcohol&#8221;, (2) &#8220;beer or wine&#8221;, and (3) &#8220;spirit&#8221;. They were chosen because beer and wine contained an alcohol strength of not more than 30%, and it was upon this group of liquors that the HKSAR Government halved the duty in 2007 and then abolished it in 2008. To better compare the concepts of &#8220;beer or wine&#8221; and &#8220;spirit&#8221;, &#8220;alcohol&#8221; was chosen as the control (ie, the broader) concept to calculate the prevalence ratios, in addition to the prevalence rates.</p>
                        <p>
                            <xref ref-type="fig" rid="figure1">Figure 1</xref> shows the concepts and keywords that were typed into the search field. All keywords were in traditional Chinese, which was more often used than simplified Chinese or English in Hong Kong. Compared to using keywords in both Chinese and English, it could (1) enhance the homogeneity of the output data, and (2) reduce the size of the output data to ease subsequent manual analysis.</p>
                    </sec>
                    <sec>
                        <title>Keyword &#8220;Alcohol&#8221;</title>
                        <p>The English word &#8220;alcohol&#8221; was translated to Chinese using Lin Yutang&#8217;s Chinese-English Dictionary of Modern Usage (Online Version) [<xref ref-type="bibr" rid="ref50">50</xref>]. In general, two or more Chinese characters made up a Chinese word. Different Chinese words might share the same meaning, whereas some Chinese words might have more than one meanings. To reduce confusion and widen the search coverage, only the Chinese character  shown in <xref ref-type="fig" rid="figure1">Figure 1</xref> was used for alcohol, instead of other Chinese words with the same meaning. It should be noted, however, that some Chinese translations were simply taken from the phonics in English without including the Chinese character for alcohol (eg, champagne, whisky, brandy). It would be impossible (and impractical) to guarantee a full coverage of the search results for all kinds of beer, wine, and spirit using the single Chinese character for alcohol shown in <xref ref-type="fig" rid="figure1">Figure 1</xref>. Nonetheless, it already provided the largest inclusion as a control concept of this study.</p>
                    </sec>
                    <sec>
                        <title>Keywords &#8220;Beer or Wine&#8221; and &#8220;Spirit&#8221;</title>
                        <p>Keywords that belonged to the concepts &#8220;beer or wine&#8221; and &#8220;spirit&#8221; were chosen from a document released by the Customs and Excise Department of the HKSAR Government [<xref ref-type="bibr" rid="ref51">51</xref>], which related to the budget proposals about changes in the beer and wine tax. They contrasted the impacts brought about by the tax policy. Generic terms with variable alcoholic strength were excluded (eg, sake, sugar spirit, reprocessing Chinese liquor). The rest were categorized under &#8220;beer or wine&#8221; if the alcohol strength was not more than 30%, or &#8220;spirit&#8221; if otherwise.</p>
                        <fig id="figure1" position="float">
                            <label>Figure 1</label>
                            <caption>
                                <p>Alcohol-related concepts and their corresponding Chinese keywords typed into the search field.</p>
                            </caption>
                            <graphic xlink:href="jmir_v15i9e192_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                        </fig>
                    </sec>
                </sec>
            </sec>
            <sec>
                <title>Collection of Epidemiological Data</title>
                <p>
                    <xref ref-type="table" rid="table2">Table 2</xref> shows the per capita alcohol consumption extracted from a report released by the Department of Health of the HKSAR Government in 2011 [<xref ref-type="bibr" rid="ref4">4</xref>]. It was adopted in our study because it was (1) freely accessible, (2) presented in a longitudinal form, and (3) subgrouped according to alcohol types. Data from 2011 were not available, and no updates of the data were seen hitherto.</p>
            </sec>
            <sec>
                <title>Quantitative Analysis</title>
                <sec>
                    <title>Infodemiological Metrics: Apparent Prevalence, Actual Prevalence, Prevalence Rate, and Prevalence Ratio</title>
                    <p>Eysenbach advocated the use of relative indicators such as rates and ratios in lieu of absolute figures to represent information prevalence since the number of websites was constantly changing [<xref ref-type="bibr" rid="ref15">15</xref>]. With slight modifications of his proposal, the following infodemiological metrics were used to indicate the online popularity of the concepts in blog posts: (1) apparent prevalence, (2) actual prevalence, (3) prevalence rate, and (4) prevalence ratio. The definitions/formulae of the metrics are shown in <xref ref-type="fig" rid="figure2">Figure 2</xref>. The apparent prevalence referred to an estimate by the blog search engine, and the actual prevalence was confirmed by the researcher who did the counting while accessing each website. The apparent prevalence instead of actual prevalence was used to calculate the prevalence rate because the total number of blog posts was again an estimate by the blog search engine. Similarly, the prevalence ratio was calculated using apparent prevalence instead of actual prevalence to avoid confusion in the correlation analysis.</p>
                    <table-wrap position="float" id="table2">
                        <label>Table 2</label>
                        <caption>
                            <p>Total and per capita alcohol consumption in Hong Kong from 2005-2010 (adapted from the Department of Health of the HKSAR Government).</p>
                        </caption>
                        <table width="617" border="1" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                            <col width="42" />
                            <col width="88" />
                            <col width="109" />
                            <col width="88" />
                            <col width="88" />
                            <col width="115" />
                            <thead>
                                <tr valign="top">
                                    <td rowspan="2">Year</td>
                                    <td colspan="2">Total pure alcohol consumption (in liters)</td>
                                    <td rowspan="2">Population aged &#8805;15 years</td>
                                    <td colspan="2">Per capita alcohol consumption (in liters)</td>
                                </tr>
                                <tr valign="top">
                                    <td>Beer and wine</td>
                                    <td>Spirit</td>
                                    <td>Beer and wine</td>
                                    <td>Spirit</td>
                                </tr>
                            </thead>
                            <tbody>
                                <tr valign="top">
                                    <td>2005</td>
                                    <td>9,382,633</td>
                                    <td>5,376,813</td>
                                    <td>5,844,300</td>
                                    <td>1.61</td>
                                    <td>0.92</td>
                                </tr>
                                <tr valign="top">
                                    <td>2006</td>
                                    <td>9,442,114</td>
                                    <td>5,586,247</td>
                                    <td>5,918,000</td>
                                    <td>1.60</td>
                                    <td>0.94</td>
                                </tr>
                                <tr valign="top">
                                    <td>2007</td>
                                    <td>9,878,382</td>
                                    <td>5,927,246</td>
                                    <td>6,004,700</td>
                                    <td>1.65</td>
                                    <td>0.99</td>
                                </tr>
                                <tr valign="top">
                                    <td>2008</td>
                                    <td>12,309,905</td>
                                    <td>5,946,634</td>
                                    <td>6,075,400</td>
                                    <td>2.03</td>
                                    <td>0.98</td>
                                </tr>
                                <tr valign="top">
                                    <td>2009</td>
                                    <td>11,973,446</td>
                                    <td>4,244,254</td>
                                    <td>6,130,300</td>
                                    <td>1.95</td>
                                    <td>0.69</td>
                                </tr>
                                <tr valign="top">
                                    <td>2010</td>
                                    <td>11,252,645</td>
                                    <td>5,156,867</td>
                                    <td>6,209,800</td>
                                    <td>1.81</td>
                                    <td>0.83</td>
                                </tr>
                            </tbody>
                        </table>
                    </table-wrap>
                    <fig id="figure2" position="float">
                        <label>Figure 2</label>
                        <caption>
                            <p>Definitions/formulae of the infodemiological metrics.</p>
                        </caption>
                        <graphic xlink:href="jmir_v15i9e192_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                    </fig>
                </sec>
                <sec>
                    <title>Pearson and Spearman Correlations</title>
                    <p>A correlation analysis was done to validate the use of infodemiological data in surveying the drinking patterns of the local population, as shown in <xref ref-type="table" rid="table3">Table 3</xref>. Essentially, the infodemiological data (ie, prevalence rates and ratios) acted as the independent variable whereas the epidemiological data (ie, per capita alcohol consumption) acted as the dependent variable. Pearson and Spearman correlations were calculated using the Statistical Package for the Social Sciences (SPSS).</p>
                </sec>
            </sec>
            <sec>
                <title>Qualitative Analysis</title>
                <p>Once blog searching was done, the blog posts were saved in .html files for subsequent analysis to avoid discrepancy due to time lag. The manual analysis focused on (1) blog author characteristics (ie, authorship, sex, and age), and (2) blog content (ie, frequency of keywords, description of a discrete episode of alcohol drinking, drinking amount, and genres). They would provide further information about the validity of utilizing blog searching data in an epidemiological survey. Their subcategories and criteria are listed in <xref ref-type="table" rid="table4">Table 4</xref>.</p>
                <p>Blog posts with &#8220;alcohol&#8221; keywords were not included for manual analysis since a large portion of them were expected to overlap with those that contained &#8220;beer or wine&#8221; and &#8220;spirit&#8221; keywords. They might not be particularly helpful in analyzing the drinking pattern (eg, choice of alcohol) of the population.</p>
                <p>It was noteworthy that most of the free text analytic tools did not support Chinese language and had no way to identify position of the keywords within a blog (eg, header, main body, sidebar, footer, and comment). Currently available concordancers for Chinese language were not too user-friendly as they lacked an external encoder/decoder, keyword-in-context (KWIC) format, or built-in dictionaries for semantic analysis or opinion mining [<xref ref-type="bibr" rid="ref52">52</xref>]. This was why manual analysis was chosen in this study as a preliminary measure to explore the blog author characteristics and blog content.</p>
                <table-wrap position="float" id="table3">
                    <label>Table 3</label>
                    <caption>
                        <p>Correlation of infodemiological and epidemiological data.</p>
                    </caption>
                    <table width="617" border="1" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                        <col width="278" />
                        <col width="309" />
                        <thead>
                            <tr valign="top">
                                <td>Infodemiological data</td>
                                <td>Epidemiological data</td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td>&#8220;alcohol&#8221; prevalence rate</td>
                                <td>Per capita consumption of all alcoholic types</td>
                            </tr>
                            <tr valign="top">
                                <td>&#8220;beer or wine&#8221; prevalence rate</td>
                                <td>Per capita consumption of beer and wine</td>
                            </tr>
                            <tr valign="top">
                                <td>&#8220;spirit&#8221; prevalence rate</td>
                                <td>Per capita consumption of spirits</td>
                            </tr>
                            <tr valign="top">
                                <td>&#8220;beer or wine&#8221; / &#8220;alcohol&#8221; prevalence ratio</td>
                                <td>Per capita consumption of beer and wine</td>
                            </tr>
                            <tr valign="top">
                                <td>&#8220;spirit&#8221; / &#8220;alcohol&#8221; prevalence ratio</td>
                                <td>Per capita consumption of spirits</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
                <table-wrap position="float" id="table4">
                    <label>Table 4</label>
                    <caption>
                        <p>Categories, subcategories, and criteria for manual analysis of blog posts containing &#8220;beer or wine&#8221; and &#8220;spirit&#8221; keywords in MySinaBlog from 2005-2010.</p>
                    </caption>
                    <table width="617" border="1" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                        <col width="193" />
                        <col width="394" />
                        <thead>
                            <tr valign="top">
                                <td>Categories</td>
                                <td>Subcategories</td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td>Authorship</td>
                                <td>(1) Single author, or (2) multiple authors</td>
                            </tr>
                            <tr valign="top">
                                <td>Sex</td>
                                <td>(1) Female, (2) male, or (3) unknown</td>
                            </tr>
                            <tr valign="top">
                                <td>Age</td>
                                <td>(1) Below 18 years old, (2) 18 years old and above, or (3) unknown</td>
                            </tr>
                            <tr valign="top">
                                <td>Frequency of keywords</td>
                                <td>Not applicable</td>
                            </tr>
                            <tr valign="top">
                                <td>Description of a discrete episode of alcohol drinking</td>
                                <td>(1) Yes, or (2) no</td>
                            </tr>
                            <tr valign="top">
                                <td>Drinking amount</td>
                                <td>(1) Binge drinking, (2) non-binge drinking, and (3) undetermined</td>
                            </tr>
                            <tr valign="top">
                                <td>Genres</td>
                                <td>(1) Name of a place/person/entity not belonging to alcohol, eg, lyrics, (2) recipe/dish name, (3) news/copied article from an external source, (4) story narrative/film synopsis, (5) health/educational information, (6) non-opinionated featured article, (7) personal diary/opinion/emotional outlet, or (8) more than one of the above</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
            </sec>
        </sec>
        <sec sec-type="results">
            <title>Results</title>
            <sec>
                <title>Overview</title>
                <p>The blog search was done on April 12, 2013, and the manual analysis was completed by researcher, KL Chan, in the subsequent week. The results are described below.</p>
            </sec>
            <sec>
                <title>Quantitative and Correlation Analysis</title>
                <sec>
                    <title>Apparent and Actual Prevalence</title>
                    <p>
                        <xref ref-type="table" rid="table5">Table 5</xref> shows that the total number of blog posts in MySinaBlog increased dramatically within 5 years&#8217; time, from less than 500 in 2005 to more than 20,000 in 2010. An increasing trend was also observed for the apparent prevalence of &#8220;alcohol&#8221;, &#8220;beer or wine&#8221;, and &#8220;spirit&#8221; except in 2010 when that of &#8220;beer or wine&#8221; and &#8220;spirit&#8221; dropped compared to the year before.</p>
                    <p>The apparent prevalence of &#8220;alcohol&#8221; was consistently higher than that of &#8220;beer or wine&#8221; and &#8220;spirit&#8221;, which made sense as &#8220;alcohol&#8221; was the control concept. However, in 2005 the apparent prevalence of &#8220;alcohol&#8221; was only 3, compared to that of &#8220;beer or wine&#8221;, which was 5. This might be explained by translation difficulties where the Chinese character of &#8220;alcohol&#8221; did not cover all keywords of &#8220;beer or wine&#8221; and &#8220;spirit&#8221;. On the other hand, the apparent prevalence of &#8220;beer or wine&#8221; was higher than that of &#8220;spirits&#8221; in 2005-2007 and 2010. In 2008 however, the two were equal, and in 2009, the apparent prevalence of &#8220;spirit&#8221; surpassed that of &#8220;beer or wine&#8221; by a difference of 17.</p>
                    <p>The discrepancies between apparent and actual prevalence became more obvious when their values enlarged in all three concepts. For example, the apparent prevalence of &#8220;alcohol&#8221; in 2005 was 3 and was the same as the actual prevalence; but in 2006, as the former increased to 26, the two differed by 12. By the time the apparent prevalence of &#8220;alcohol&#8221; reached up to 1390 in 2010, the actual prevalence of &#8220;alcohol&#8221; was only 195, representing a difference of 1195. Of particular note, the actual prevalence of &#8220;spirits&#8221; of 12 in 2008 and 13 in 2009 was much lower than its apparent prevalence of 73 and 115, respectively, due to spams in blogs. The trends of the apparent and actual prevalence were grossly symmetrical for &#8220;alcohol&#8221; and &#8220;beer or wine&#8221; except that in 2010, the actual prevalence of &#8220;beer or wine&#8221; peaked instead of waning.</p>
                    <table-wrap position="float" id="table5">
                        <label>Table 5</label>
                        <caption>
                            <p>Total number of blog post, apparent and actual prevalence of alcohol-related concepts in MySinaBlog from 2005-2010.</p>
                        </caption>
                        <table width="617" border="1" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                            <col width="62" />
                            <col width="151" />
                            <col width="111" />
                            <col width="111" />
                            <col width="110" />
                            <thead>
                                <tr valign="top">
                                    <td rowspan="2">Year</td>
                                    <td rowspan="2">Total number of blog posts</td>
                                    <td colspan="3">Apparent prevalence (actual prevalence)</td>
                                </tr>
                                <tr valign="top">
                                    <td>&#8220;Alcohol&#8221;</td>
                                    <td>&#8220;Beer or wine&#8221;</td>
                                    <td>&#8220;Spirit&#8221;</td>
                                </tr>
                            </thead>
                            <tbody>
                                <tr valign="top">
                                    <td>2005</td>
                                    <td>394</td>
                                    <td>3 (3)</td>
                                    <td>5 (5)</td>
                                    <td>0 (0)</td>
                                </tr>
                                <tr valign="top">
                                    <td>2006</td>
                                    <td>1810</td>
                                    <td>26 (14)</td>
                                    <td>16 (15)</td>
                                    <td>3 (3)</td>
                                </tr>
                                <tr valign="top">
                                    <td>2007</td>
                                    <td>5620</td>
                                    <td>120 (59)</td>
                                    <td>27 (15)</td>
                                    <td>5 (5)</td>
                                </tr>
                                <tr valign="bottom">
                                    <td>2008</td>
                                    <td>11,500</td>
                                    <td>1180 (150<sup>a</sup>)</td>
                                    <td>73 (28)</td>
                                    <td>73 (12<sup>a,b</sup>)</td>
                                </tr>
                                <tr valign="bottom">
                                    <td>2009</td>
                                    <td>16,000</td>
                                    <td>1290 (190<sup>a</sup>)</td>
                                    <td>98 (25)</td>
                                    <td>115 (13<sup>a,b</sup>)</td>
                                </tr>
                                <tr valign="bottom">
                                    <td>2010</td>
                                    <td>20,400</td>
                                    <td>1390 (195)</td>
                                    <td>70 (41<sup>c</sup>)</td>
                                    <td>3 (3)</td>
                                </tr>
                            </tbody>
                        </table>
                        <table-wrap-foot>
                            <fn id="table6fn1">
                                <p>
                                    <sup>a</sup>Final figures included those blog posts that were initially hidden and prompted by the blog search engine.</p>
                            </fn>
                            <fn id="table6fn2">
                                <p>
                                    <sup>b</sup>After excluding blogs with spams that actually contained no keywords.</p>
                            </fn>
                            <fn id="table6fn3">
                                <p>
                                    <sup>c</sup>After excluding one blog post that was inaccessible due to security reasons.</p>
                            </fn>
                        </table-wrap-foot>
                    </table-wrap>
                </sec>
                <sec>
                    <title>Prevalence Rate and Correlation Coefficients</title>
                    <p>
                        <xref ref-type="table" rid="table6">Table 6</xref> shows that the prevalence rate of &#8220;alcohol&#8221; followed an inverted V shape, increasing steadily from 0.76% in 2005 to 2.14% in 2007, peaking at 10.26% in 2008, and decreasing to 8.06% in 2009 and then to 6.81% in 2010. The prevalence rate of &#8220;beer or wine&#8221; declined over the years with its first trough of 0.48% in 2007 and second trough of 0.34% in 2010. The prevalence rate of &#8220;spirit&#8221; was quite the opposite, initially hovering at a low level of 0% to 0.17% in 2005-2007, then surging up to 0.72% in 2008-2009, and eventually falling back to 0.01% in 2010.</p>
                    <p>The prevalence rate of &#8220;alcohol&#8221; was consistently higher than that of &#8220;beer or wine&#8221; and &#8220;spirit&#8221; except in 2005 when the prevalence rate of &#8220;alcohol&#8221; was only 0.76%, compared to that of &#8220;beer or wine&#8221;, which was 1.27%. This might be explained by translation difficulties as stated before. The prevalence rate of &#8220;spirit&#8221; was the lowest among all three concepts in 2005-2007 and 2010. However, in 2008, it tied with the prevalence rate of &#8220;beer or wine&#8221;, and in 2009, exceeded it altogether.</p>
                    <p>Per capita consumption of alcohol correlated strongly with the prevalence rate of &#8220;alcohol&#8221; (Pearson correlation=0.81, <italic>P</italic>=.05; Spearman correlation=1.00, <italic>P</italic>&#60;.001). The linear relationship was marginally significant and the nonlinear relationship was significant. The prevalence rate of &#8220;beer or wine&#8221; was negatively and moderately correlated with per capita consumption of beer and wine (Pearson correlation=-0.48, <italic>P</italic>=.34; Spearman correlation=-0.43, <italic>P</italic>=.40). Both were nonsignificant. Similarly, the prevalence rate of &#8220;spirit&#8221; had a moderate negative linear correlation (Pearson correlation=-0.40, <italic>P</italic>=.43) and a weak negative nonlinear correlation (Spearman correlation=-0.09, <italic>P</italic>=.87) with per capita consumption of spirits. Again, both were nonsignificant.</p>
                </sec>
                <sec>
                    <title>Prevalence Ratio and Correlation Coefficients</title>
                    <p>
                        <xref ref-type="table" rid="table7">Table 7</xref> shows that the prevalence ratio of &#8220;beer or wine&#8221; / &#8220;alcohol&#8221; declined as a whole, troughing at 0.06 in 2008 and 0.05 in 2010. The prevalence ratio of &#8220;spirit&#8221; / &#8220;alcohol&#8221;, on the other hand, peaked at 0.12 in 2006 and 0.09 in 2009. The former was higher in 2005-2007 and 2010. However, in 2008, the two tied, and in 2009, the prevalence ratio of &#8220;spirit&#8221; / &#8220;alcohol&#8221; reached 0.09, surpassing that of 0.08 for &#8220;beer or wine&#8221; / &#8220;alcohol&#8221;.</p>
                    <p>The prevalence ratio of &#8220;beer or wine&#8221; / &#8220;alcohol&#8221; had a strong negative correlation with per capita consumption of beer and wine (Pearson correlation=-0.65, <italic>P</italic>=.16; Spearman correlation=-0.77, <italic>P</italic>=.07). The correlation coefficients were nonsignificant. The prevalence ratio of &#8220;spirit&#8221; / &#8220;alcohol&#8221; was also negatively correlated with per capita consumption of spirits but only weakly (Pearson correlation=-0.10, <italic>P</italic>=.85; Spearman correlation=-0.03, <italic>P</italic>=.96). Again, both correlation coefficients were nonsignificant.</p>
                    <table-wrap position="float" id="table6">
                        <label>Table 6</label>
                        <caption>
                            <p>Prevalence rate of alcohol-related concepts in MySinaBlog and correlation coefficients compared with per capita consumption of the same alcohol types in Hong Kong from 2005-2010.</p>
                        </caption>
                        <table width="617" border="1" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                            <col width="186" />
                            <col width="75" />
                            <col width="91" />
                            <col width="98" />
                            <col width="95" />
                            <thead>
                                <tr valign="top">
                                    <td>
                                        <break />
                                    </td>
                                    <td>
                                        <break />
                                    </td>
                                    <td colspan="3">Prevalence rate (%)</td>
                                </tr>
                                <tr valign="top">
                                    <td>
                                        <break />
                                    </td>
                                    <td>
                                        <break />
                                    </td>
                                    <td>&#8220;Alcohol&#8221;</td>
                                    <td>&#8220;Beer or wine&#8221;</td>
                                    <td>&#8220;Spirit&#8221;</td>
                                </tr>
                            </thead>
                            <tbody>
                                <tr valign="top">
                                    <td>
                                        <bold>Year</bold>
                                    </td>
                                    <td>
                                        <break />
                                    </td>
                                    <td>
                                        <break />
                                    </td>
                                    <td>
                                        <break />
                                    </td>
                                    <td>
                                        <break />
                                    </td>
                                </tr>
                                <tr valign="top">
                                    <td>
                                        <break />
                                    </td>
                                    <td>2005</td>
                                    <td>0.76</td>
                                    <td>1.27</td>
                                    <td>0</td>
                                </tr>
                                <tr valign="top">
                                    <td>
                                        <break />
                                    </td>
                                    <td>2006</td>
                                    <td>1.44</td>
                                    <td>0.88</td>
                                    <td>0.17</td>
                                </tr>
                                <tr valign="top">
                                    <td>
                                        <break />
                                    </td>
                                    <td>
                                        <break />
                                    </td>
                                    <td>
                                        <break />
                                    </td>
                                    <td>
                                        <break />
                                    </td>
                                    <td>
                                        <break />
                                    </td>
                                </tr>
                                <tr valign="top">
                                    <td>
                                        <break />
                                    </td>
                                    <td>2007</td>
                                    <td>2.14</td>
                                    <td>0.48</td>
                                    <td>0.09</td>
                                </tr>
                                <tr valign="top">
                                    <td>
                                        <break />
                                    </td>
                                    <td>2008</td>
                                    <td>10.26</td>
                                    <td>0.63</td>
                                    <td>0.63</td>
                                </tr>
                                <tr valign="top">
                                    <td>
                                        <break />
                                    </td>
                                    <td>2009</td>
                                    <td>8.06</td>
                                    <td>0.61</td>
                                    <td>0.72</td>
                                </tr>
                                <tr valign="top">
                                    <td>
                                        <break />
                                    </td>
                                    <td>
                                        <break />
                                    </td>
                                    <td>
                                        <break />
                                    </td>
                                    <td>
                                        <break />
                                    </td>
                                    <td>
                                        <break />
                                    </td>
                                </tr>
                                <tr valign="top">
                                    <td>
                                        <break />
                                    </td>
                                    <td>2010</td>
                                    <td>6.81</td>
                                    <td>0.34</td>
                                    <td>0.01</td>
                                </tr>
                                <tr valign="top">
                                    <td>
                                        <bold>Correlation coefficients (<italic>P value</italic>)</bold>
                                    </td>
                                    <td>
                                        <break />
                                    </td>
                                    <td>
                                        <break />
                                    </td>
                                    <td>
                                        <break />
                                    </td>
                                    <td>
                                        <break />
                                    </td>
                                </tr>
                                <tr valign="top">
                                    <td>
                                        <break />
                                    </td>
                                    <td>Pearson</td>
                                    <td>0.81 (.05)</td>
                                    <td>-0.48 (.34)</td>
                                    <td>-0.40 (.43)</td>
                                </tr>
                                <tr valign="top">
                                    <td>
                                        <break />
                                    </td>
                                    <td>Spearman</td>
                                    <td>1.00 (&#60;.001)</td>
                                    <td>-0.43 (.40)</td>
                                    <td>-0.09 (.87)</td>
                                </tr>
                            </tbody>
                        </table>
                    </table-wrap>
                    <table-wrap position="float" id="table7">
                        <label>Table 7</label>
                        <caption>
                            <p>Prevalence ratios of alcohol-related concepts in MySinaBlog and correlation coefficients compared with per capita consumption of the same alcohol types in Hong Kong from 2005-2010.</p>
                        </caption>
                        <table width="617" border="1" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                            <col width="170" />
                            <col width="63" />
                            <col width="176" />
                            <col width="150" />
                            <thead>
                                <tr valign="top">
                                    <td>
                                        <break />
                                    </td>
                                    <td>
                                        <break />
                                    </td>
                                    <td colspan="2">Prevalence ratio (%)</td>
                                </tr>
                                <tr valign="top">
                                    <td>
                                        <break />
                                    </td>
                                    <td>
                                        <break />
                                    </td>
                                    <td>&#8220;Beer or wine&#8221; / &#8220;alcohol&#8221;</td>
                                    <td>&#8220;Spirit&#8221; / &#8220;alcohol&#8221;</td>
                                </tr>
                            </thead>
                            <tbody>
                                <tr valign="top">
                                    <td>
                                        <bold>Year</bold>
                                    </td>
                                    <td>
                                        <break />
                                    </td>
                                    <td>
                                        <break />
                                    </td>
                                    <td>
                                        <break />
                                    </td>
                                </tr>
                                <tr valign="top">
                                    <td rowspan="6">
                                        <break />
                                    </td>
                                    <td>2005</td>
                                    <td>1.67</td>
                                    <td>0</td>
                                </tr>
                                <tr valign="top">
                                    <td>2006</td>
                                    <td>0.62</td>
                                    <td>0.12</td>
                                </tr>
                                <tr valign="top">
                                    <td>2007</td>
                                    <td>0.23</td>
                                    <td>0.04</td>
                                </tr>
                                <tr valign="top">
                                    <td>2008</td>
                                    <td>0.06</td>
                                    <td>0.06</td>
                                </tr>
                                <tr valign="top">
                                    <td>2009</td>
                                    <td>0.08</td>
                                    <td>0.09</td>
                                </tr>
                                <tr valign="top">
                                    <td>2010</td>
                                    <td>0.05</td>
                                    <td>0.00</td>
                                </tr>
                                <tr valign="top">
                                    <td>
                                        <bold>Correlation coefficients (<italic>P value</italic>)</bold>
                                    </td>
                                    <td>
                                        <break />
                                    </td>
                                    <td>
                                        <break />
                                    </td>
                                    <td>
                                        <break />
                                    </td>
                                </tr>
                                <tr valign="top">
                                    <td>
                                        <break />
                                    </td>
                                    <td>Pearson</td>
                                    <td>-0.65 (.16)</td>
                                    <td>-0.10 (.85)</td>
                                </tr>
                                <tr valign="top">
                                    <td>
                                        <break />
                                    </td>
                                    <td>Spearman</td>
                                    <td>-0.77 (.07)</td>
                                    <td>-0.03 (.96)</td>
                                </tr>
                            </tbody>
                        </table>
                    </table-wrap>
                </sec>
            </sec>
            <sec>
                <title>Qualitative Analysis</title>
                <sec>
                    <title>Blog Author Characteristics</title>
                    <p>
                        <xref ref-type="fig" rid="figure3">Figure 3</xref> illustrates that a substantial number of blogs with alcohol-related keywords in MySinaBlog from 2005-2010 were written by single authors (97.1%, 134/138). For those single authors whose sex identity was known, their sex distribution was equal (female=38.1%, 51/134; male=38.1%, 51/134; unknown=23.9%, 32/134) (<xref ref-type="fig" rid="figure4">Figure 4</xref>). Most single authors also did not indicate their age (unknown age=75.4%, 101/134), while the rest were mostly adults (18 years old or above=22.4%, 30/134) (<xref ref-type="fig" rid="figure5">Figure 5</xref>). All parameters appeared to increase with time, possibly explained by the increase in the total number of blogs.</p>
                </sec>
                <sec>
                    <title>Blog Content</title>
                    <p>As shown in <xref ref-type="fig" rid="figure6">Figures 6</xref> and <xref ref-type="fig" rid="figure7">7</xref>, not all alcohol-related keywords were found in the blog posts of MySinaBlog in 2005-2010. Among &#8220;beer or wine&#8221; keywords, &#8220;beer&#8221; was the most common. It had an accumulated frequency of 324 from 2005-2010 and peaked at a point frequency of 153 in 2010. &#8220;Champagne&#8221; was the second most common, followed by &#8220;port wine&#8221;, and lastly &#8220;perry&#8221;. As for &#8220;spirit&#8221; keywords, &#8220;whisky&#8221; was the most common. It had an accumulated frequency of 67 from 2005-2010 and peaked at a point frequency of 21 in 2010. &#8220;Rum&#8221; was the second most common, followed by &#8220;brandy&#8221;, and lastly &#8220;vodka&#8221;. The point frequency of the keywords seemed to rise over the years, possibly explained by an increase in the actual prevalence of the blog posts.</p>
                    <p>As shown in <xref ref-type="fig" rid="figure8">Figure 8</xref>, not all blog posts actually described a discrete episode of alcohol drinking (alcohol type specified by the keyword) by the author in Hong Kong and in the same year when the blog post was published. In fact, only 11.5% (19/165) of them did so, with limited information regarding the drinking amount and duration. It was thus difficult to differentiate between binge and non-binge drinking (binge drinking=0%; non-binge drinking=26.3%, 5/19; undetermined=73.7%, 14/19) (<xref ref-type="fig" rid="figure9">Figure 9</xref>; [<xref ref-type="bibr" rid="ref35">35</xref>]). The others were mostly personal diary, opinion, or emotional outlet (28.1%, 41/146) (<xref ref-type="fig" rid="figure10">Figure 10</xref>). In <xref ref-type="fig" rid="figure10">Figure 10</xref>, the name is the name of a place, person, or entity not belonging to alcohol, eg, lyrics; recipe is recipe or dish name; news is the news/copied article from an external source; story is the story narrative/film synopsis; health info is the health or educational information; featured article is the non-opinionated featured article; personal diary is a personal diary, opinion, or emotional outlet. The immediate text surrounding the keyword(s) was first examined. If a decision was not made or the keywords were too disperse, the entire blog post was examined. Former options should be considered before latter ones.</p>
                    <fig id="figure3" position="float">
                        <label>Figure 3</label>
                        <caption>
                            <p>Actual prevalence of blogs with alcohol-related keywords in MySinaBlog from 2005-2010 classified according to authorship (corporational or organizational blogs were counted as multiple authors; different blog posts by the same registered user in the same year were counted as one blog).</p>
                        </caption>
                        <graphic xlink:href="jmir_v15i9e192_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                    </fig>
                    <fig id="figure4" position="float">
                        <label>Figure 4</label>
                        <caption>
                            <p>Actual prevalence of blogs with alcohol-related keywords in MySinaBlog from 2005-2010 classified according to sex of the single authors.</p>
                        </caption>
                        <graphic xlink:href="jmir_v15i9e192_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                    </fig>
                    <fig id="figure5" position="float">
                        <label>Figure 5</label>
                        <caption>
                            <p>Actual prevalence of blogs with alcohol-related keywords in MySinaBlog from 2005-2010 classified according to age of the single authors.</p>
                        </caption>
                        <graphic xlink:href="jmir_v15i9e192_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                    </fig>
                    <fig id="figure6" position="float">
                        <label>Figure 6</label>
                        <caption>
                            <p>Point frequency of &#34;beer or wine&#34; keywords in main body of the blog posts of MySinaBlog from 2005-2010.</p>
                        </caption>
                        <graphic xlink:href="jmir_v15i9e192_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                    </fig>
                    <fig id="figure7" position="float">
                        <label>Figure 7</label>
                        <caption>
                            <p>Point frequency of &#34;spirit&#34; keywords in main body of the blog posts of MySinaBlog from 2005-2010.</p>
                        </caption>
                        <graphic xlink:href="jmir_v15i9e192_fig7.png" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                    </fig>
                    <fig id="figure8" position="float">
                        <label>Figure 8</label>
                        <caption>
                            <p>Actual prevalence of blog posts with alcohol-related keywords in MySinaBlog from 2005-2010 classified according to description of a discrete episode of alcohol drinking (alcohol used for cooking was excluded).</p>
                        </caption>
                        <graphic xlink:href="jmir_v15i9e192_fig8.png" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                    </fig>
                    <fig id="figure9" position="float">
                        <label>Figure 9</label>
                        <caption>
                            <p>Actual prevalence of blog posts with alcohol-related keywords and description of a discrete episode of alcohol drinking in MySinaBlog from 2005-2010 classified according to drinking pattern (binge drinking defined as 5 alcoholic drinks in a row within a couple of hours).</p>
                        </caption>
                        <graphic xlink:href="jmir_v15i9e192_fig9.png" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                    </fig>
                    <fig id="figure10" position="float">
                        <label>Figure 10</label>
                        <caption>
                            <p>Actual prevalence of blog posts with alcohol-related keywords but no description of a discrete episode of alcohol drinking in MySinaBlog from 2005-2010 classified according to genre.</p>
                        </caption>
                        <graphic xlink:href="jmir_v15i9e192_fig10.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                    </fig>
                </sec>
            </sec>
        </sec>
        <sec sec-type="discussion">
            <title>Discussion</title>
            <sec>
                <title>Changes in the Online Popularity of Alcohol-Related Concepts</title>
                <p>The online popularity of alcohol-related concepts was best represented by their prevalence rate and ratio, which normalized the effect of any changes in the total number of blogs [<xref ref-type="bibr" rid="ref14">14</xref>]. In general, the concept &#8220;alcohol&#8221; was most popular in 2008. The concept &#8220;spirit&#8221; also experienced a short-lasting and somewhat erratic rise in its online popularity in 2008-2009. The concept &#8220;beer or wine&#8221;, in contrast, became increasingly unwelcome with an overall declining trend in its online popularity over the years. The hypothesis that alcohol-related concepts became more popular after 2007-2008 was true only for &#8220;alcohol&#8221; and &#8220;spirit&#8221; but not &#8220;beer or wine&#8221;.</p>
                <p>One possible reason for the increase in the online popularity of &#8220;spirit&#8221; keywords in 2008-2009 was the presence of spam in the same years. This was masked in the apparent prevalence, which was used to calculate the prevalence rate and ratio. Indeed, after excluding the data in 2008-2009, the prevalence rate and ratio of the concept &#8220;spirit&#8221; remained relatively stable at a low level. The false elevation in the online popularity of &#8220;spirit&#8221; might also explain the peak prevalence rate of &#8220;alcohol&#8221; in 2008, although the latter appeared much larger in amplitude and there was still a chance for a genuine rise in keywords which were not included in &#8220;beer or wine&#8221; or &#8220;spirit&#8221; but &#8220;alcohol&#8221;. The downhill course in the online popularity of &#8220;beer or wine&#8221; was probably a true reflection of bloggers&#8217; decreased interest over the topic. However, its relation to local drinking pattern remained doubtful, since many of the blog posts were in fact not describing a discrete episode of alcohol drinking. The same argument held true for the concepts &#8220;spirit&#8221; and &#8220;alcohol&#8221;.</p>
            </sec>
            <sec>
                <title>Validating Blog Searching as an Infoveillance Method for Surveying Drinking Patterns</title>
                <p>Validation of blog searching data depended on correlation analysis and manual analysis of blog author characteristics and contents. The prevalence rate of &#8220;alcohol&#8221; was the only parameter that had a significant nonlinear and a marginally significant linear correlation with per capita alcohol consumption. The other correlations were all nonsignificant, although many of them demonstrated moderate to strong strengths. The hypothesis that infodemiological data correlated significantly with local epidemiological data was true only for &#8220;alcohol&#8221; prevalence rate. The statistical nonsignificance of other infodemiological metrics might be explained by the small number of blog posts relative to the population. This in turn could be attributed to the following:</p>
                <list list-type="order">
                    <list-item>
                        <p>Choice of keywords. The list of keywords for &#8220;beer or wine&#8221; and &#8220;spirit&#8221; could never be exhaustive since their types were many and expressions by bloggers were highly variable. Mixed code of Chinese characters and English letters was not uncommon for online communications among Hong Kong people. Some of them would actually type Cantonese (dialect of Yue Chinese) rather than standard Chinese [<xref ref-type="bibr" rid="ref53">53</xref>]. They might use a different Chinese word as the translation of the same liquor. They might also use the brand name of the liquor they took. This was partly reflected by the frequency of individual alcohol-related keyword in the blog posts, showing that some were not used by bloggers at all. All these added difficulties in selecting the appropriate keywords that gave an adequate coverage within the word limit of the search query.</p>
                    </list-item>
                    <list-item>
                        <p>Passive blogging behavior among Hong Kong people. In a survey done by the HKSAR Government in February to April 2011, 53.4% of Internet users had browsed contents at forums or blogs in the preceding 12 months, yet only around 15.8% had compiled or created webpages or blogs in the same period [<xref ref-type="bibr" rid="ref42">42</xref>].</p>
                    </list-item>
                </list>
                <p>From the manual analysis, most blogs were managed by single authors, meaning that the number of blogs could be used to represent the number of individual attendants in a population survey. The sex distribution of the single blog authors was close to the local population, but their age range was slightly inclined to 18 years old and above [<xref ref-type="bibr" rid="ref54">54</xref>]. It should be noted, however, that many of the bloggers did not disclose their identity online, making validation difficult.</p>
                <p>Many of the blog posts were not about a discrete episode of alcohol drinking but personal diary, opinion, or emotion outlet. This was not surprising as new genres of blogs continued to emerge [<xref ref-type="bibr" rid="ref55">55</xref>]. Rather than just being informative, many blogs were affective in nature requiring semantic analysis for meaningful interpretation [<xref ref-type="bibr" rid="ref25">25</xref>]. While it was unlikely that bloggers recorded their alcohol intake on each occasion, they might reveal their understanding on alcohol drinking when commenting on a particular event, answering a particular question, and describing a childhood incident, etc, hence, the presence of alcohol-related keywords. While there were inadequate clues to support that changes in the online popularity of the alcohol-related keywords were related to an altered drinking pattern of the local population, one should not ignore its social implications and disregard its role in evaluating public reactions towards health-related policy including the zero beer and wine tax.</p>
            </sec>
            <sec>
                <title>Research Limitations and Solutions</title>
                <p>Using blogs as the source of information had several inherent limitations. For example, demographic data of individual blogger such as gender, age, and race might be deficient or disguised; bloggers tended to share common interests and backgrounds that were probably different from those of the general population; and acquisition of precise data such as drinking patterns was often difficult. In order to construct a larger framework in a timely and efficient manner, informatics researchers often had to compromise the individuality of each blogger by using certain infodemiological metrics. Moreover, language usage by bloggers tended to be complex and not easily decoded by the frequency of some pre-determined keywords. As a solution, semantic analysis of individual blog post might be useful to explore bloggers&#8217; opinions towards drinking, provided enough technical support. Face-to-face interviews and questionnaires might be conducted with individual bloggers to elaborate their viewpoints, preferably those who appeared to have the largest influence within a specific blog circle (using a social network analytic tool).</p>
                <p>No single blog search engine indexed all blogs [<xref ref-type="bibr" rid="ref56">56</xref>]. Despite its automaticity, a search engine might be subject to editorial choice and hence bias [<xref ref-type="bibr" rid="ref57">57</xref>]. There were concerns that even in the same search engine, the search results may be different over time [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref44">44</xref>]. In our case, it might be explained by the (1) inherent limitation in the search algorithms of Google, which gave only an approximate estimate for query with large results, and (2) inconsistency of the search database due to a variable number of splogs (or spam blogs) and blogs that were previously not linked [<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref56">56</xref>]. Of note, a large part of the Google Search algorithm was unknown to the public, aggravating sampling uncertainty in our study.</p>
                <p>One challenge with the use of Chinese language in blog searching was that it tended to have a wide range of expressions owing to geographical difference and translation from English. Also, only a limited number of blog analytic tools supported the Chinese language. A self-designed research program with well-informed blog search algorithms and analytic functions especially for Chinese blogs would be most desirable, which would depend heavily on the availability of expertise and resources.</p>
            </sec>
            <sec>
                <title>Conclusion and Recommendations for Future Research</title>
                <p>Using blog searching data from a Hong Kong&#8211;based Chinese blog service provider, we concluded the following: (1) the online popularity of alcohol-related Chinese keywords was attributed to many different factors including spam, and hence not a specific reflection of local drinking patterns, (2) correlation between infodemiological data (represented by prevalence rates and ratios of alcohol-related concepts) and epidemiological data (represented by per capita alcohol consumption) was poor, and (3) many blog posts were affective rather than informative in nature. While blog searches using pre-defined Chinese keywords might not be an ideal method to survey epidemiological data such as alcohol consumption, semantic analysis of blog content would provide invaluable information on public reactions towards health-related policy, given enough expertise and resources.</p>
            </sec>
        </sec>
    </body>
    <back>
        <glossary>
            <title>Abbreviations</title>
            <def-list>
                <def-item>
                    <term id="abb1">HKSAR</term>
                    <def>
                        <p>Hong Kong Special Administrative Region</p>
                    </def>
                </def-item>
            </def-list>
        </glossary>
        <ack>
            <p>We thank Dr LM Ho from the School of Public Health, University of Hong Kong, for statistical advice.</p>
        </ack>
        <fn-group>
            <fn fn-type="conflict">
                <p>None declared.</p>
            </fn>
        </fn-group>
        <ref-list>
            <ref id="ref1">
                <label>1</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <collab>International Agency For Research on Cancer</collab>
                        <collab>World Health Organization</collab>
                    </person-group>
                    <source>Alcohol Drinking, in IARC Monographs on the Evaluation of Carcinogenic Risks to Humans</source>
                    <year>1988</year>
                    <access-date>2013-06-26</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://monographs.iarc.fr/ENG/Monographs/vol44/volume44.pdf">http://monographs.iarc.fr/ENG/Monographs/vol44/volume44.pdf</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6HfISAYpQ</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref2">
                <label>2</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <collab>World Health Organization</collab>
                    </person-group>
                    <source>Substance abuse - Facts and figures</source>
                    <year>2012</year>
                    <access-date>2012-05-14</access-date>
                    <comment>Alcohol<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.who.int/substance_abuse/facts/alcohol/en/index.html">http://www.who.int/substance_abuse/facts/alcohol/en/index.html</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">67eMQSQ3Z</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref3">
                <label>3</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <collab>World Health Organization</collab>
                    </person-group>
                    <source>2008-2013 Action Plan for the Global Strategy for the Prevention and Control of Noncommunicable Diseases</source>
                    <access-date>2013-06-26</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://whqlibdoc.who.int/publications/2009/9789241597418_eng.pdf">http://whqlibdoc.who.int/publications/2009/9789241597418_eng.pdf</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6HfIXwaMY</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref4">
                <label>4</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <collab>Department of Health, The Government of the Hong Kong Special Administrative Region</collab>
                    </person-group>
                    <source>Action Plan to Reduce Alcohol-related Harm in Hong Kong</source>
                    <year>2011</year>
                    <access-date>2013-06-26</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.change4health.gov.hk/filemanager/common/image/strategic_framework/alcohol_action_plan/action_plan_e.pdf">http://www.change4health.gov.hk/filemanager/common/image/strategic_framework/alcohol_action_plan/action_plan_e.pdf</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6HfJ4QRRp</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref5">
                <label>5</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <collab>Youth Research Centre</collab>
                    </person-group>
                    <source>A Study on the Alcohol Drinking Habits Among Youth in Hong Kong, in Youth Study Series</source>
                    <year>2000</year>
                    <publisher-loc>Hong Kong</publisher-loc>
                    <publisher-name>Youth study series</publisher-name>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://yrc.hkfyg.org.hk/news.aspx?id=6b656879-efed-4886-af11-e74caad87856&#38;corpname=yrc&#38;i=2527&#38;locale=en-US">http://yrc.hkfyg.org.hk/news.aspx?id=6b656879-efed-4886-af11-e74caad87856&#38;corpname=yrc&#38;i=2527&#38;locale=en-US</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6J48LbobX</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref6">
                <label>6</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <collab>Surveillance and Epidemiology Branch, Department of Health, the Government of the Hong Kong Special Administrative Region</collab>
                    </person-group>
                    <source>Non-communicable Disease Watch</source>
                    <year>2012</year>
                    <access-date>2013-06-26</access-date>
                    <comment>Change for Health - Drink Less or Not at All<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.chp.gov.hk/files/pdf/ncd_watch_may2012.pdf">http://www.chp.gov.hk/files/pdf/ncd_watch_may2012.pdf</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6HfJ8m7Yn</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref7">
                <label>7</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <collab>The Government of the Hong Kong Special Administrative Region</collab>
                    </person-group>
                    <source>The 2007-2008 Budget Speech</source>
                    <year>2007</year>
                    <access-date>2012-05-14</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.budget.gov.hk/2007/eng/speech.htm">http://www.budget.gov.hk/2007/eng/speech.htm</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">67ePWseOw</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref8">
                <label>8</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <collab>The Government of the Hong Kong Special Administrative Region</collab>
                    </person-group>
                    <source>The 2008-2009 Budget Speech</source>
                    <year>2008</year>
                    <access-date>2012-05-02</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.budget.gov.hk/2008/eng/speech.html">http://www.budget.gov.hk/2008/eng/speech.html</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">67MHbYgXI</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref9">
                <label>9</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Lam</surname>
                            <given-names>TH</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Chim</surname>
                            <given-names>D</given-names>
                        </name>
                    </person-group>
                    <article-title>Controlling alcohol-related global health problems</article-title>
                    <source>Asia Pac J Public Health</source>
                    <year>2010</year>
                    <month>07</month>
                    <volume>22</volume>
                    <issue>3 Suppl</issue>
                    <fpage>203S</fpage>
                    <lpage>208S</lpage>
                    <pub-id pub-id-type="doi">10.1177/1010539510373013</pub-id>
                    <pub-id pub-id-type="medline">20566555</pub-id>
                    <pub-id pub-id-type="pii">22/3_suppl/203S</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref10">
                <label>10</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Wagenaar</surname>
                            <given-names>AC</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Salois</surname>
                            <given-names>MJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Komro</surname>
                            <given-names>KA</given-names>
                        </name>
                    </person-group>
                    <article-title>Effects of beverage alcohol price and tax levels on drinking: a meta-analysis of 1003 estimates from 112 studies</article-title>
                    <source>Addiction</source>
                    <year>2009</year>
                    <month>02</month>
                    <volume>104</volume>
                    <issue>2</issue>
                    <fpage>179</fpage>
                    <lpage>90</lpage>
                    <pub-id pub-id-type="doi">10.1111/j.1360-0443.2008.02438.x</pub-id>
                    <pub-id pub-id-type="medline">19149811</pub-id>
                    <pub-id pub-id-type="pii">ADD2438</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref11">
                <label>11</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>M&#228;kel&#228;</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Osterberg</surname>
                            <given-names>E</given-names>
                        </name>
                    </person-group>
                    <article-title>Weakening of one more alcohol control pillar: a review of the effects of the alcohol tax cuts in Finland in 2004</article-title>
                    <source>Addiction</source>
                    <year>2009</year>
                    <month>04</month>
                    <volume>104</volume>
                    <issue>4</issue>
                    <fpage>554</fpage>
                    <lpage>63</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/19335654" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1111/j.1360-0443.2009.02517.x</pub-id>
                    <pub-id pub-id-type="medline">19335654</pub-id>
                    <pub-id pub-id-type="pii">ADD2517</pub-id>
                    <pub-id pub-id-type="pmcid">PMC2928916</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref12">
                <label>12</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Herttua</surname>
                            <given-names>K</given-names>
                        </name>
                        <name name-style="western">
                            <surname>M&#228;kel&#228;</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Martikainen</surname>
                            <given-names>P</given-names>
                        </name>
                    </person-group>
                    <article-title>The effects of a large reduction in alcohol prices on hospitalizations related to alcohol: a population-based natural experiment</article-title>
                    <source>Addiction</source>
                    <year>2011</year>
                    <month>04</month>
                    <volume>106</volume>
                    <issue>4</issue>
                    <fpage>759</fpage>
                    <lpage>67</lpage>
                    <pub-id pub-id-type="doi">10.1111/j.1360-0443.2010.03296.x</pub-id>
                    <pub-id pub-id-type="medline">21205044</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref13">
                <label>13</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Koski</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sir&#233;n</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Vuori</surname>
                            <given-names>E</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Poikolainen</surname>
                            <given-names>K</given-names>
                        </name>
                    </person-group>
                    <article-title>Alcohol tax cuts and increase in alcohol-positive sudden deaths: a time-series intervention analysis</article-title>
                    <source>Addiction</source>
                    <year>2007</year>
                    <month>03</month>
                    <volume>102</volume>
                    <issue>3</issue>
                    <fpage>362</fpage>
                    <lpage>8</lpage>
                    <pub-id pub-id-type="doi">10.1111/j.1360-0443.2006.01715.x</pub-id>
                    <pub-id pub-id-type="medline">17298642</pub-id>
                    <pub-id pub-id-type="pii">ADD1715</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref14">
                <label>14</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Eysenbach</surname>
                            <given-names>G</given-names>
                        </name>
                    </person-group>
                    <article-title>Infodemiology and infoveillance: framework for an emerging set of public health informatics methods to analyze search, communication and publication behavior on the Internet</article-title>
                    <source>J Med Internet Res</source>
                    <year>2009</year>
                    <volume>11</volume>
                    <issue>1</issue>
                    <fpage>e11</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2009/1/e11/" />
                    </comment>
                    <pub-id pub-id-type="doi">10.2196/jmir.1157</pub-id>
                    <pub-id pub-id-type="medline">19329408</pub-id>
                    <pub-id pub-id-type="pii">v11i1e11</pub-id>
                    <pub-id pub-id-type="pmcid">PMC2762766</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref15">
                <label>15</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Eysenbach</surname>
                            <given-names>G</given-names>
                        </name>
                    </person-group>
                    <article-title>Infodemiology and infoveillance tracking online health information and cyberbehavior for public health</article-title>
                    <source>Am J Prev Med</source>
                    <year>2011</year>
                    <month>05</month>
                    <volume>40</volume>
                    <issue>5 Suppl 2</issue>
                    <fpage>S154</fpage>
                    <lpage>8</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.amepre.2011.02.006</pub-id>
                    <pub-id pub-id-type="medline">21521589</pub-id>
                    <pub-id pub-id-type="pii">S0749-3797(11)00088-2</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref16">
                <label>16</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Eysenbach</surname>
                            <given-names>G</given-names>
                        </name>
                    </person-group>
                    <article-title>Infodemiology: tracking flu-related searches on the web for syndromic surveillance</article-title>
                    <source>AMIA Annu Symp Proc</source>
                    <year>2006</year>
                    <fpage>244</fpage>
                    <lpage>8</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/17238340" />
                    </comment>
                    <pub-id pub-id-type="medline">17238340</pub-id>
                    <pub-id pub-id-type="pii">86095</pub-id>
                    <pub-id pub-id-type="pmcid">PMC1839505</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref17">
                <label>17</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Eysenbach</surname>
                            <given-names>G</given-names>
                        </name>
                    </person-group>
                    <article-title>Infodemiology: The epidemiology of (mis)information</article-title>
                    <source>Am J Med</source>
                    <year>2002</year>
                    <month>12</month>
                    <day>15</day>
                    <volume>113</volume>
                    <issue>9</issue>
                    <fpage>763</fpage>
                    <lpage>5</lpage>
                    <pub-id pub-id-type="medline">12517369</pub-id>
                    <pub-id pub-id-type="pii">S0002934302014730</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref18">
                <label>18</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Ginsberg</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Mohebbi</surname>
                            <given-names>MH</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Patel</surname>
                            <given-names>RS</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Brammer</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Smolinski</surname>
                            <given-names>MS</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Brilliant</surname>
                            <given-names>L</given-names>
                        </name>
                    </person-group>
                    <article-title>Detecting influenza epidemics using search engine query data</article-title>
                    <source>Nature</source>
                    <year>2009</year>
                    <month>02</month>
                    <day>19</day>
                    <volume>457</volume>
                    <issue>7232</issue>
                    <fpage>1012</fpage>
                    <lpage>4</lpage>
                    <pub-id pub-id-type="doi">10.1038/nature07634</pub-id>
                    <pub-id pub-id-type="medline">19020500</pub-id>
                    <pub-id pub-id-type="pii">nature07634</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref19">
                <label>19</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Wilson</surname>
                            <given-names>K</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Brownstein</surname>
                            <given-names>JS</given-names>
                        </name>
                    </person-group>
                    <article-title>Early detection of disease outbreaks using the Internet</article-title>
                    <source>CMAJ</source>
                    <year>2009</year>
                    <month>04</month>
                    <day>14</day>
                    <volume>180</volume>
                    <issue>8</issue>
                    <fpage>829</fpage>
                    <lpage>31</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.cmaj.ca/cgi/pmidlookup?view=long&#38;pmid=19364791" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1503/cmaj.090215</pub-id>
                    <pub-id pub-id-type="medline">19364791</pub-id>
                    <pub-id pub-id-type="pii">180/8/829</pub-id>
                    <pub-id pub-id-type="pmcid">PMC2665960</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref20">
                <label>20</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Althouse</surname>
                            <given-names>BM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ng</surname>
                            <given-names>YY</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Cummings</surname>
                            <given-names>DA</given-names>
                        </name>
                    </person-group>
                    <article-title>Prediction of dengue incidence using search query surveillance</article-title>
                    <source>PLoS Negl Trop Dis</source>
                    <year>2011</year>
                    <month>08</month>
                    <volume>5</volume>
                    <issue>8</issue>
                    <fpage>e1258</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pntd.0001258" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1371/journal.pntd.0001258</pub-id>
                    <pub-id pub-id-type="medline">21829744</pub-id>
                    <pub-id pub-id-type="pii">PNTD-D-11-00369</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3149016</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref21">
                <label>21</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Wong</surname>
                            <given-names>PW</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Fu</surname>
                            <given-names>KW</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Yau</surname>
                            <given-names>RS</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ma</surname>
                            <given-names>HH</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Law</surname>
                            <given-names>YW</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Chang</surname>
                            <given-names>SS</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Yip</surname>
                            <given-names>PS</given-names>
                        </name>
                    </person-group>
                    <article-title>Accessing suicide-related information on the internet: a retrospective observational study of search behavior</article-title>
                    <source>J Med Internet Res</source>
                    <year>2013</year>
                    <volume>15</volume>
                    <issue>1</issue>
                    <fpage>e3</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2013/1/e3/" />
                    </comment>
                    <pub-id pub-id-type="doi">10.2196/jmir.2181</pub-id>
                    <pub-id pub-id-type="medline">23305632</pub-id>
                    <pub-id pub-id-type="pii">v15i1e3</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3636013</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref22">
                <label>22</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Ayers</surname>
                            <given-names>JW</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Althouse</surname>
                            <given-names>BM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Allem</surname>
                            <given-names>JP</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ford</surname>
                            <given-names>DE</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ribisl</surname>
                            <given-names>KM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Cohen</surname>
                            <given-names>JE</given-names>
                        </name>
                    </person-group>
                    <article-title>A novel evaluation of World No Tobacco day in Latin America</article-title>
                    <source>J Med Internet Res</source>
                    <year>2012</year>
                    <volume>14</volume>
                    <issue>3</issue>
                    <fpage>e77</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2012/3/e77/" />
                    </comment>
                    <pub-id pub-id-type="doi">10.2196/jmir.2148</pub-id>
                    <pub-id pub-id-type="medline">22634568</pub-id>
                    <pub-id pub-id-type="pii">v14i3e77</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref23">
                <label>23</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Ayers</surname>
                            <given-names>JW</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ribisl</surname>
                            <given-names>K</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Brownstein</surname>
                            <given-names>JS</given-names>
                        </name>
                    </person-group>
                    <article-title>Using search query surveillance to monitor tax avoidance and smoking cessation following the United States' 2009 &#34;SCHIP&#34; cigarette tax increase</article-title>
                    <source>PLoS One</source>
                    <year>2011</year>
                    <volume>6</volume>
                    <issue>3</issue>
                    <fpage>e16777</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0016777" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1371/journal.pone.0016777</pub-id>
                    <pub-id pub-id-type="medline">21436883</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3059206</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref24">
                <label>24</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Chew</surname>
                            <given-names>C</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Eysenbach</surname>
                            <given-names>G</given-names>
                        </name>
                    </person-group>
                    <article-title>Pandemics in the age of Twitter: content analysis of Tweets during the 2009 H1N1 outbreak</article-title>
                    <source>PLoS One</source>
                    <year>2010</year>
                    <volume>5</volume>
                    <issue>11</issue>
                    <fpage>e14118</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0014118" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1371/journal.pone.0014118</pub-id>
                    <pub-id pub-id-type="medline">21124761</pub-id>
                    <pub-id pub-id-type="pmcid">PMC2993925</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref25">
                <label>25</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Kamel Boulos</surname>
                            <given-names>MN</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sanfilippo</surname>
                            <given-names>AP</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Corley</surname>
                            <given-names>CD</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Wheeler</surname>
                            <given-names>S</given-names>
                        </name>
                    </person-group>
                    <article-title>Social Web mining and exploitation for serious applications: Technosocial Predictive Analytics and related technologies for public health, environmental and national security surveillance</article-title>
                    <source>Comput Methods Programs Biomed</source>
                    <year>2010</year>
                    <month>10</month>
                    <volume>100</volume>
                    <issue>1</issue>
                    <fpage>16</fpage>
                    <lpage>23</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.cmpb.2010.02.007</pub-id>
                    <pub-id pub-id-type="medline">20236725</pub-id>
                    <pub-id pub-id-type="pii">S0169-2607(10)00038-6</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref26">
                <label>26</label>
                <nlm-citation citation-type="book">
                    <person-group person-group-type="author">
                        <collab>Institute of Medicine (US) Forum on Microbial Threats</collab>
                    </person-group>
                    <source>Global Infectious Disease Surveillance and Detection: Assessing the Challenges--Finding Solutions, Workshop Summary</source>
                    <year>2007</year>
                    <publisher-loc>Washington, DC</publisher-loc>
                    <publisher-name>National Academies Press</publisher-name>
                </nlm-citation>
            </ref>
            <ref id="ref27">
                <label>27</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Zhang</surname>
                            <given-names>H</given-names>
                        </name>
                    </person-group>
                    <article-title>Research on Knowledge Sharing Mechanism Based on Web 2.0</article-title>
                    <source>International Seminar on Future Information Technology and Management Engineering</source>
                    <year>2008</year>
                    <conf-name>FITME '08</conf-name>
                    <conf-date>Nov. 20, 2008</conf-date>
                    <conf-loc>Leicestershire, UK</conf-loc>
                    <fpage>210</fpage>
                    <lpage>213</lpage>
                    <pub-id pub-id-type="doi">10.1109/fitme.2008.14</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref28">
                <label>28</label>
                <nlm-citation citation-type="book">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Russell</surname>
                            <given-names>MA</given-names>
                        </name>
                    </person-group>
                    <article-title>s</article-title>
                    <source>Mining the Social Web: Analyzing Data from Facebook, Twitter, LinkedIn, and Other Social Media Site</source>
                    <year>2011</year>
                    <publisher-loc>Sebastopol, CA</publisher-loc>
                    <publisher-name>O&#039;Reilly Media</publisher-name>
                </nlm-citation>
            </ref>
            <ref id="ref29">
                <label>29</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Rosenbloom</surname>
                            <given-names>A</given-names>
                        </name>
                    </person-group>
                    <article-title>The blogosphere</article-title>
                    <source>Communications of the ACM</source>
                    <year>2004</year>
                    <month>12</month>
                    <day>01</day>
                    <volume>47</volume>
                    <issue>12</issue>
                    <fpage>30</fpage>
                    <pub-id pub-id-type="doi">10.1145/1035134.1035161</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref30">
                <label>30</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Kwai Fun IP</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Wagner</surname>
                            <given-names>C</given-names>
                        </name>
                    </person-group>
                    <article-title>Weblogging: A study of social computing and its impact on organizations</article-title>
                    <source>Decision Support Systems</source>
                    <year>2008</year>
                    <month>5</month>
                    <volume>45</volume>
                    <issue>2</issue>
                    <fpage>242</fpage>
                    <lpage>250</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.dss.2007.02.004</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref31">
                <label>31</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Du</surname>
                            <given-names>HS</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Wagner</surname>
                            <given-names>C</given-names>
                        </name>
                    </person-group>
                    <article-title>Weblog success: Exploring the role of technology</article-title>
                    <source>International Journal of Human-Computer Studies</source>
                    <year>2006</year>
                    <month>9</month>
                    <volume>64</volume>
                    <issue>9</issue>
                    <fpage>789</fpage>
                    <lpage>798</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.ijhcs.2006.04.002</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref32">
                <label>32</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Nardi</surname>
                            <given-names>BA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Schiano</surname>
                            <given-names>DJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Gumbrecht</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Swartz</surname>
                            <given-names>L</given-names>
                        </name>
                    </person-group>
                    <article-title>Why we blog</article-title>
                    <source>Communications of the ACM</source>
                    <year>2004</year>
                    <month>12</month>
                    <day>01</day>
                    <volume>47</volume>
                    <issue>12</issue>
                    <fpage>41</fpage>
                    <pub-id pub-id-type="doi">10.1145/1035134.1035163</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref33">
                <label>33</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Qian</surname>
                            <given-names>H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Craig</surname>
                            <given-names>RS</given-names>
                        </name>
                    </person-group>
                    <article-title>Anonymity and Self-Disclosure on Weblogs</article-title>
                    <source>Journal of Computer-Mediated Communication</source>
                    <year>2007</year>
                    <volume>12</volume>
                    <issue>4</issue>
                    <fpage>1428</fpage>
                    <lpage>1451</lpage>
                    <pub-id pub-id-type="doi">10.1111/j.1083-6101.2007.00380.x</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref34">
                <label>34</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Chau</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Xu</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Cao</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lam</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Shiu</surname>
                            <given-names>B</given-names>
                        </name>
                    </person-group>
                    <article-title>A Blog Mining Framework</article-title>
                    <source>IT Prof</source>
                    <year>2009</year>
                    <month>01</month>
                    <volume>11</volume>
                    <issue>1</issue>
                    <fpage>36</fpage>
                    <lpage>41</lpage>
                    <pub-id pub-id-type="doi">10.1109/mitp.2009.1</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref35">
                <label>35</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Thelwall</surname>
                            <given-names>M</given-names>
                        </name>
                    </person-group>
                    <article-title>Blog searching: The first general-purpose source of retrospective public opinion in the social sciences?</article-title>
                    <source>Online Information Review</source>
                    <year>2007</year>
                    <volume>31</volume>
                    <issue>3</issue>
                    <fpage>277</fpage>
                    <lpage>289</lpage>
                    <pub-id pub-id-type="doi">10.1108/14684520710764069</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref36">
                <label>36</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Lu</surname>
                            <given-names>H</given-names>
                        </name>
                    </person-group>
                    <article-title>Public Opinion between Blogsphere and Real World</article-title>
                    <source>Proceedings of the Annual Conference of the World Association for Public Opinion Research</source>
                    <year>2012</year>
                    <conf-name>The Annual Conference of the World Association for Public Opinion Research</conf-name>
                    <conf-date>2012</conf-date>
                    <conf-loc>Hong Kong</conf-loc>
                </nlm-citation>
            </ref>
            <ref id="ref37">
                <label>37</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Chau</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Xu</surname>
                            <given-names>J</given-names>
                        </name>
                    </person-group>
                    <article-title>Mining communities and their relationships in blogs: A study of online hate groups</article-title>
                    <source>International Journal of Human-Computer Studies</source>
                    <year>2007</year>
                    <month>1</month>
                    <volume>65</volume>
                    <issue>1</issue>
                    <fpage>57</fpage>
                    <lpage>70</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.ijhcs.2006.08.009</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref38">
                <label>38</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Chen</surname>
                            <given-names>Y</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Tsai</surname>
                            <given-names>FS</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Chan</surname>
                            <given-names>KL</given-names>
                        </name>
                    </person-group>
                    <article-title>Blog search and mining in the business domain</article-title>
                    <source>Proceedings of the 2007 international workshop on Domain driven data mining</source>
                    <year>2007</year>
                    <conf-name>International workshop on Domain driven data mining</conf-name>
                    <conf-date>Aug. 12-15, 2007</conf-date>
                    <conf-loc>San Jose, CA</conf-loc>
                    <fpage>55</fpage>
                    <lpage>60</lpage>
                    <pub-id pub-id-type="doi">10.1145/1288552.1288560</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref39">
                <label>39</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Conrad</surname>
                            <given-names>JG</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Schilder</surname>
                            <given-names>F</given-names>
                        </name>
                    </person-group>
                    <article-title>Opinion mining in legal blogs</article-title>
                    <source>Proceedings of the 11th international conference on Artificial intelligence and law</source>
                    <year>2007</year>
                    <conf-name>11th International conference on Artificial intelligence and law</conf-name>
                    <conf-date>June 4-8, 2007</conf-date>
                    <conf-loc>Palo Alto</conf-loc>
                    <fpage>231</fpage>
                    <lpage>236</lpage>
                    <pub-id pub-id-type="doi">10.1145/1276318.1276363</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref40">
                <label>40</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>O'Leary</surname>
                            <given-names>DE</given-names>
                        </name>
                    </person-group>
                    <article-title>Blog mining-review and extensions: &#8220;From each according to his opinion&#8221;</article-title>
                    <source>Decision Support Systems</source>
                    <year>2011</year>
                    <month>11</month>
                    <volume>51</volume>
                    <issue>4</issue>
                    <fpage>821</fpage>
                    <lpage>830</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.dss.2011.01.016</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref41">
                <label>41</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <collab>Social Surveys Section</collab>
                        <collab>Census and Statistics Department</collab>
                        <collab>The Government of the Hong Kong Special Administrative Region</collab>
                    </person-group>
                    <source>Thematic Household Survey Report No 50</source>
                    <year>2013</year>
                    <access-date>2013-06-26</access-date>
                    <publisher-loc>Hong Kong</publisher-loc>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.digital21.gov.hk/eng/statistics/download/householdreport2013.pdf">http://www.digital21.gov.hk/eng/statistics/download/householdreport2013.pdf</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6HfJGQcWU</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref42">
                <label>42</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <collab>Social Surveys Section</collab>
                        <collab>Census and Statistics Department</collab>
                        <collab>The Government of the Hong Kong Special Administrative Region</collab>
                    </person-group>
                    <source>Thematic Household Survey Report No 49</source>
                    <year>2012</year>
                    <access-date>2013-06-26</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.statistics.gov.hk/pub/B11302492012XXXXB0100.pdf">http://www.statistics.gov.hk/pub/B11302492012XXXXB0100.pdf</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6HfJMGSO6</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref43">
                <label>43</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <collab>Blog-You</collab>
                    </person-group>
                    <source>Hong Kong Blogger Survey Result</source>
                    <access-date>2012-05-02</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://blog-you.com/events/survey/">http://blog-you.com/events/survey/</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">67M9R7Q18</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref44">
                <label>44</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Thelwall</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hasler</surname>
                            <given-names>L</given-names>
                        </name>
                    </person-group>
                    <article-title>Blog search engines</article-title>
                    <source>Online Information Review</source>
                    <year>2007</year>
                    <volume>31</volume>
                    <issue>4</issue>
                    <fpage>467</fpage>
                    <lpage>479</lpage>
                    <pub-id pub-id-type="doi">10.1108/14684520710780421</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref45">
                <label>45</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <collab>GH (HONGKONG) CO</collab>
                    </person-group>
                    <source>Hong Kong Free Blog Websites</source>
                    <access-date>2013-04-11</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://852.com/internet/free_blog.htm">http://852.com/internet/free_blog.htm</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6Fo1Qxrhe</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref46">
                <label>46</label>
                <nlm-citation citation-type="web">
                    <source>TopTenReviews</source>
                    <access-date>2013-04-11</access-date>
                    <comment>2013 Blog Service Comparisons<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://blog-services-review.toptenreviews.com/">http://blog-services-review.toptenreviews.com/</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6Fo2O3kVX</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref47">
                <label>47</label>
                <nlm-citation citation-type="web">
                    <source>Alexa Internet</source>
                    <access-date>2013-08-20</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.alexa.com/">http://www.alexa.com/</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6J1Za5Y4c</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref48">
                <label>48</label>
                <nlm-citation citation-type="web">
                    <source>StatsCrop</source>
                    <access-date>2013-08-20</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.statscrop.com/">http://www.statscrop.com/</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6J1Zbrijf</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref49">
                <label>49</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <collab>Alexa Internet</collab>
                    </person-group>
                    <source>MySinaBlog. Site Info</source>
                    <access-date>2012-05-02</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.alexa.com/siteinfo/mysinablog.com">http://www.alexa.com/siteinfo/mysinablog.com</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">67MRoycuX</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref50">
                <label>50</label>
                <nlm-citation citation-type="web">
                    <source>Lin Yutang&#039;s Chinese-English Dictionary of Modern Usage (Online Version)</source>
                    <access-date>2013-08-20</access-date>
                    <publisher-loc>English</publisher-loc>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://humanum.arts.cuhk.edu.hk/Lexis/Lindict/">http://humanum.arts.cuhk.edu.hk/Lexis/Lindict/</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6J1Zgxl06</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref51">
                <label>51</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <collab>Office of Dutiable Commodities Administration, Customs and Excise Department, The Government of the Hong Kong Administrative Region</collab>
                    </person-group>
                    <source>Removal of Licensing/Permit Arrangements on Wine and Liquor with an Alcoholic Strength of not more than 30%, 2008: Hong Kong</source>
                    <access-date>2013-06-26</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.customs.gov.hk/filemanager/common/pdf/pdf_notice/fact_sheet_eng.pdf">http://www.customs.gov.hk/filemanager/common/pdf/pdf_notice/fact_sheet_eng.pdf</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6HfJS66Ty</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref52">
                <label>52</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Chan</surname>
                            <given-names>MK</given-names>
                        </name>
                    </person-group>
                    <article-title>Concordancers and concordances: Tools for Chinese language teaching and research</article-title>
                    <source>Journal-Chinese Language Teachers Association</source>
                    <year>2002</year>
                    <volume>37</volume>
                    <issue>2</issue>
                    <fpage>1</fpage>
                    <lpage>58</lpage>
                </nlm-citation>
            </ref>
            <ref id="ref53">
                <label>53</label>
                <nlm-citation citation-type="book">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Chiu</surname>
                            <given-names>WN</given-names>
                        </name>
                    </person-group>
                    <source>Language Choice on the Internet: The Use of Written Cantonese on Web Sites</source>
                    <year>2005</year>
                    <publisher-loc>Hong Kong</publisher-loc>
                    <publisher-name>University of Hong Kong</publisher-name>
                </nlm-citation>
            </ref>
            <ref id="ref54">
                <label>54</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <collab>General Statistics Section, Census and Statistics Department, The Government of the Hong Kong Special Administrative Region</collab>
                    </person-group>
                    <source>Hong Kong Monthly Digest of Statistics (April 2013), 2013: Hong Kong</source>
                    <access-date>2013-06-26</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.statistics.gov.hk/pub/B10100022013MM04B0100.pdf">http://www.statistics.gov.hk/pub/B10100022013MM04B0100.pdf</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6HfJWRiVh</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref55">
                <label>55</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Herring</surname>
                            <given-names>SC</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Scheidt</surname>
                            <given-names>LA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Bonus</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Wright</surname>
                            <given-names>E</given-names>
                        </name>
                    </person-group>
                    <article-title>Bridging the gap: A genre analysis of weblogs</article-title>
                    <source>Proceedings of the 37th Hawaii International Conference on System Sciences</source>
                    <year>2004</year>
                    <conf-name>37th Hawaii International Conference on System Sciences</conf-name>
                    <conf-date>Jan. 5-8, 2004</conf-date>
                    <conf-loc>Big Island, Hawaii</conf-loc>
                    <publisher-name>IEEE</publisher-name>
                </nlm-citation>
            </ref>
            <ref id="ref56">
                <label>56</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Li</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Walejko</surname>
                            <given-names>G</given-names>
                        </name>
                    </person-group>
                    <article-title>Splogs and Abandoned Blogs: The perils of sampling bloggers and their blogs</article-title>
                    <source>Information, Communication &#38; Society</source>
                    <year>2008</year>
                    <month>03</month>
                    <volume>11</volume>
                    <issue>2</issue>
                    <fpage>279</fpage>
                    <lpage>296</lpage>
                    <pub-id pub-id-type="doi">10.1080/13691180801947976</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref57">
                <label>57</label>
                <nlm-citation citation-type="book">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Goldman</surname>
                            <given-names>E</given-names>
                        </name>
                    </person-group>
                    <person-group person-group-type="editor">
                        <name name-style="western">
                            <surname>Spink</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Zimmer</surname>
                            <given-names>M</given-names>
                        </name>
                    </person-group>
                    <article-title>Search Engine Bias and the Demise of Search Engine Utopianism</article-title>
                    <source>Web Search</source>
                    <year>2008</year>
                    <publisher-loc>Berlin</publisher-loc>
                    <publisher-name>Springer</publisher-name>
                    <fpage>121</fpage>
                    <lpage>133</lpage>
                </nlm-citation>
            </ref>
        </ref-list>
    </back>
</article>
