<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
    <front>
        <journal-meta>
            <journal-id journal-id-type="publisher-id">JMIR</journal-id>
            <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
            <journal-title>Journal of Medical Internet Research</journal-title>
            <issn pub-type="epub">14388871</issn>
            <publisher>
                <publisher-name>JMIR Publications Inc.</publisher-name>
                <publisher-loc>Toronto, Canada</publisher-loc>
            </publisher>
        </journal-meta>
        <article-meta>
            <article-id pub-id-type="publisher-id">v16i2e29</article-id>
            <article-id pub-id-type="pmid">24496094</article-id>
            <article-id pub-id-type="doi">10.2196/jmir.3078</article-id>
            <article-categories>
                <subj-group subj-group-type="article-type">
                    <subject>Original Paper</subject>
                </subj-group>
            </article-categories>
            <title-group>
                <article-title>Investigating the Congruence of Crowdsourced Information With Official Government Data: The Case of Pediatric Clinics</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="editor">
                    <name>
                        <surname>Eysenbach</surname>
                        <given-names>Gunther</given-names>
                    </name>
                </contrib>
            </contrib-group>
            <contrib-group>
                <contrib contrib-type="reviewer">
                    <name>
                        <surname>Choi</surname>
                        <given-names>Jinwook</given-names>
                    </name>
                </contrib>
                <contrib contrib-type="reviewer">
                    <name>
                        <surname>Tak</surname>
                        <given-names>Hyojung</given-names>
                    </name>
                </contrib>
                <contrib contrib-type="reviewer">
                    <name>
                        <surname>Lee</surname>
                        <given-names>Jooyoung</given-names>
                    </name>
                </contrib>
                <contrib contrib-type="reviewer">
                    <name>
                        <surname>Erdley</surname>
                        <given-names>Scott</given-names>
                    </name>
                </contrib>
            </contrib-group>
            <contrib-group>
                <contrib contrib-type="author" id="contrib1" corresp="yes">
                    <name name-style="western">
                        <surname>Kim</surname>
                        <given-names>Minki</given-names>
                    </name>
                    <degrees>PhD</degrees>
                    <xref ref-type="aff" rid="aff1">1</xref>
                    <address>
                        <institution>Department of Business and Technology Management</institution>
                        <institution>Korea Advanced Institute of Science and Technology</institution>
                        <addr-line>KAIST N5-2109</addr-line>
                        <addr-line>291 Daehak-ro, Yuseong-gu</addr-line>
                        <addr-line>Daejeon, 305-701</addr-line>
                        <country>Korea, Republic Of</country>
                        <phone>82 423506315</phone>
                        <fax>82 423506339</fax>
                        <email>minki.kim@kaist.ac.kr</email>
                    </address>
                </contrib>
                <contrib contrib-type="author" id="contrib2">
                    <name name-style="western">
                        <surname>Jung</surname>
                        <given-names>Yuchul</given-names>
                    </name>
                    <degrees>PhD</degrees>
                    <xref ref-type="aff" rid="aff2">2</xref>
                    <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-8871-1979</ext-link>
                </contrib>
                <contrib contrib-type="author" id="contrib3">
                    <name name-style="western">
                        <surname>Jung</surname>
                        <given-names>Dain</given-names>
                    </name>
                    <xref ref-type="aff" rid="aff1">1</xref>
                </contrib>
                <contrib contrib-type="author" id="contrib4">
                    <name name-style="western">
                        <surname>Hur</surname>
                        <given-names>Cinyoung</given-names>
                    </name>
                    <degrees>MS</degrees>
                    <xref ref-type="aff" rid="aff3">3</xref>
                </contrib>
            </contrib-group>
            <aff id="aff1" rid="aff1">
                <sup>1</sup>
                <institution>Department of Business and Technology Management</institution>
                <institution>Korea Advanced Institute of Science and Technology</institution>
                <addr-line>Daejeon</addr-line>
                <country>Korea, Republic Of</country>
            </aff>
            <aff id="aff2" rid="aff2">
                <sup>2</sup>
                <institution>Korea Institute of Science and Technology Information</institution>
                <addr-line>Daejeon</addr-line>
                <country>Korea, Republic Of</country>
            </aff>
            <aff id="aff3" rid="aff3">
                <sup>3</sup>
                <institution>Electronics and Telecommunications Research Institute</institution>
                <addr-line>Daejeon</addr-line>
                <country>Korea, Republic Of</country>
            </aff>
            <author-notes>
                <corresp>Corresponding Author: Minki Kim <email>minki.kim@kaist.ac.kr</email>
                </corresp>
            </author-notes>
            <pub-date pub-type="collection">
                <month>02</month>
                <year>2014</year>
            </pub-date>
            <pub-date pub-type="epub">
                <day>03</day>
                <month>02</month>
                <year>2014</year>
            </pub-date>
            <volume>16</volume>
            <issue>2</issue>
            <elocation-id>e29</elocation-id>
            <!--history from ojs - api-xml-->
            <history>
                <date date-type="received">
                    <day>03</day>
                    <month>11</month>
                    <year>2013</year>
                </date>
                <date date-type="rev-request">
                    <day>23</day>
                    <month>12</month>
                    <year>2013</year>
                </date>
                <date date-type="rev-recd">
                    <day>07</day>
                    <month>01</month>
                    <year>2014</year>
                </date>
                <date date-type="accepted">
                    <day>09</day>
                    <month>01</month>
                    <year>2014</year>
                </date>
            </history>
            <!--(c) the authors - correct author names and publication date here if necessary. Date in form ', dd.mm.yyyy' after jmir.org-->
            <copyright-statement>&#169;Minki Kim, Yuchul Jung, Dain Jung, Cinyoung Hur. Originally published in the Journal of Medical Internet Research (http://www.jmir.org), 03.02.2014. </copyright-statement>
            <copyright-year>2014</copyright-year>
            <license license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/2.0/">
                <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (http://creativecommons.org/licenses/by/2.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on http://www.jmir.org/, as well as this copyright and license information must be included.</p>
            </license>
            <self-uri xlink:href="http://www.jmir.org/2014/2/e29/" xlink:type="simple" />
            <abstract>
                <sec sec-type="background">
                    <title>Background</title>
                    <p>Health 2.0 benefits society by helping patients acquire knowledge about health care by harnessing collective intelligence. However, any misleading information can directly affect patients&#8217; choices of hospitals and drugs, and potentially exacerbate their health condition.</p>
                </sec>
                <sec sec-type="objective">
                    <title>Objective</title>
                    <p>This study investigates the congruence between crowdsourced information and official government data in the health care domain and identifies the determinants of low congruence where it exists. In line with infodemiology, we suggest measures to help the patients in the regions vulnerable to inaccurate health information.</p>
                </sec>
                <sec sec-type="methods">
                    <title>Methods</title>
                    <p>We text-mined multiple online health communities in South Korea to construct the data for crowdsourced information on public health services (173,748 messages). Kendall tau and Spearman rank order correlation coefficients were used to compute the differences in 2 ranking systems of health care quality: actual government evaluations of 779 hospitals and mining results of geospecific online health communities. Then we estimated the effect of sociodemographic characteristics on the level of congruence by using an ordinary least squares regression.</p>
                </sec>
                <sec sec-type="results">
                    <title>Results</title>
                    <p>The regression results indicated that the standard deviation of married women&#8217;s education (<italic>P</italic>=.046), population density (<italic>P</italic>=.01), number of doctors per pediatric clinic (<italic>P</italic>=.048), and birthrate (<italic>P</italic>=.002) have a significant effect on the congruence of crowdsourced data (adjusted <italic>R</italic>
                        <sup>
                            <italic>2</italic>
                        </sup>=.33). Specifically, (1) the higher the birthrate in a given region, (2) the larger the variance in educational attainment, (3) the higher the population density, and (4) the greater the number of doctors per clinic, the more likely that crowdsourced information from online communities is congruent with official government data.</p>
                </sec>
                <sec sec-type="conclusions">
                    <title>Conclusions</title>
                    <p>To investigate the cause of the spread of misleading health information in the online world, we adopted a unique approach by associating mining results on hospitals from geospecific online health communities with the sociodemographic characteristics of corresponding regions. We found that the congruence of crowdsourced information on health care services varied across regions and that these variations could be explained by geospecific demographic factors. This finding can be helpful to governments in reducing the potential risk of misleading online information and the accompanying safety issues.</p>
                </sec>
            </abstract>
            <kwd-group>
                <kwd>online health community</kwd>
                <kwd>crowdsourcing</kwd>
                <kwd>risk of misinformation</kwd>
                <kwd>public health</kwd>
            </kwd-group>
        </article-meta>
    </front>
    <body>
        <sec sec-type="introduction">
            <title>Introduction</title>
            <p>The advancement of information and communications technology has affected every aspect of modern society by enabling people to collectively create and exchange knowledge in pursuing their rights. In this era of Web 2.0, people can make smarter decisions with new interpretations and discoveries based on social interactions through social networking sites and online communities. With a basis in &#8220;trust your users,&#8221; Web 2.0 expedites knowledge acquisition through sharing and collaboration among Web users; that is, through harnessing collective intelligence [<xref ref-type="bibr" rid="ref1">1</xref>]. Given this background, the questions that arise are (1) whether online users are trustworthy at all times, and (2) whether crowdsourced information benefits fields that require specialized knowledge, such as health care and medicine. In public health, it is important to investigate the accuracy of crowdsourced information within online health communities because any misleading information can directly affect patients&#8217; choices of hospitals and drugs and can potentially exacerbate their health conditions. The social costs of inaccurate health information far exceed the financial costs incurred from poor choices of ordinary consumer products and services.</p>
            <p>As the Web has become an important mass medium for consumers seeking health information and health care services online, researchers have focused on the advent of Health 2.0 or Medicine 2.0, which is the application of Web 2.0 technologies to health and medicine [<xref ref-type="bibr" rid="ref2">2</xref>]. In the present era of Medicine 2.0, patients evaluate physicians and hospitals, share their health care experiences, and communicate with other patients through health-related websites [<xref ref-type="bibr" rid="ref3">3</xref>-<xref ref-type="bibr" rid="ref5">5</xref>].</p>
            <p>Proliferation of these Medicine 2.0 sites (eg, PatientsLikeMe and Hello Health) benefits society by helping patients acquire knowledge on health through collaboration [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref4">4</xref>]. As a means of promoting health education, Medicine 2.0 has also reshaped doctor-patient relationships, making them more patient friendly [<xref ref-type="bibr" rid="ref6">6</xref>].</p>
            <p>To analyze such health information and communication patterns on websites and social media, considerable literature has accumulated over the years under the name of infodemiology [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref8">8</xref>], the science of distribution and determinants of information on the Internet aiming to inform public health and public policy.</p>
            <p>In line with infodemiology, researchers have attempted to understand and analyze unstructured free-text information available from the Internet, such as health-related user-generated data, or crowdsourced data. For instance, Marcus et al [<xref ref-type="bibr" rid="ref9">9</xref>] searched Internet blogs that contained mental health-related keywords to analyze young adults&#8217; concerns regarding mental health. More recently, Zhang et al [<xref ref-type="bibr" rid="ref10">10</xref>] conducted sentiment analysis by using free-text comments about hospitals on websites and found that crowdsourced data are moderately associated with the paper-based national inpatient survey results in England.</p>
            <p>On the other hand, concerning low quality information on the Internet that could harm public health [<xref ref-type="bibr" rid="ref11">11</xref>], several studies have discussed the potential risk of inaccurate online information and accompanying safety issues. Using Google search results for severe acute respiratory syndrome (SARS) as examples, Morahan [<xref ref-type="bibr" rid="ref12">12</xref>] argued that the overall quality of online health information is a serious concern for people because virtual access to high-quality health information is counterbalanced by high access to inaccurate and even fraudulent information. A systematic review on the quality of health information has found that 70% of studies on this subject have had concerns about the quality of crowdsourced health information. In fact, even too much information affects patients, making them even more confused because they find it harder to distinguish between true and inaccurate health information [<xref ref-type="bibr" rid="ref13">13</xref>].</p>
            <p>Hence, this study focused on the following: (1) whether crowdsourced information built in the online world is accurate, and (2) if imprecise, what drives this information inaccuracy. Similar to our study, Tsai et al [<xref ref-type="bibr" rid="ref14">14</xref>] investigated social networking websites on consumer health and found that more than half of user-generated health information was incomplete or erroneous. Looking at drug information on Wikipedia, a different type of information source, Clauson et al [<xref ref-type="bibr" rid="ref15">15</xref>] also found that there are more omission errors and less completeness in Wikipedia articles than Medscape Drug Reference articles. Consistent with these studies, we show the existence of inaccurate online information. Unlike previous research, however, this study adds to the literature by demonstrating heterogeneous inaccuracy between geospecific online health communities and objective hospital ratings, and by further delving into the offline determinants of such heterogeneity. To the best of our knowledge, no previous empirical study has taken this approach.</p>
            <p>In this study, we investigate the quality of crowdsourced health information by evaluating conformity between 2 rankings: (1) government evaluations of hospitals, and (2) rankings obtained through mining of geospecific online health communities across South Korea.</p>
        </sec>
        <sec sec-type="methods">
            <title>Methods</title>
            <sec>
                <title>Overview</title>
                <p>We employed 3 types of information source: (1) governmental evaluations of medical services aimed at ranking hospitals in the region, (2) rankings provided by online communities on hospitals according to the crowdsourced information of Web users, and (3) the census results by region provided by Statistics Korea to understand the influence of demographic features on the congruence between crowdsourced information and official government data in the health care domain.</p>
            </sec>
            <sec>
                <title>Government Hospital Evaluation Information</title>
                <p>The sampled hospitals were confined to pediatric offices because young parents more eagerly seek information both online and offline, serving as agents for their children who can seldom self-diagnose the various symptoms they are suffering. According to Plantin and Daneback [<xref ref-type="bibr" rid="ref16">16</xref>], first-time mothers aged 30-35 years are most active in searching for health and patient information on the Internet. Compared with other medical fields, parents of young children more actively share information on pediatrics over online health communities [<xref ref-type="bibr" rid="ref17">17</xref>].</p>
                <p>This study was conducted in the 6 major metropolitan cities of South Korea. Specifically, we examined 30 regions in total, including 25 districts (gu) within Seoul (accounting for one-quarter of the total population of South Korea), and 5 other metropolitan cities: Gwangju, Busan, Daegu, Daejeon, and Incheon. <xref ref-type="fig" rid="figure1">Figure 1</xref> shows the geographic locations of the 30 regions.</p>
                <p>As an objective measure of the medical service quality of local pediatricians, we relied on usage rates of antibiotics. The overuse of antibiotics is a global concern because it can result in severe adverse effects for children [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>]. In fact, improper or excessive use of antibiotics also results in antibiotic-resistance problems, which, in turn, lead to unnecessary expenditures of public health care funding [<xref ref-type="bibr" rid="ref20">20</xref>]. Korea is no exception in this issue. Antibiotic prescribing behavior has changed after quality assessment of prescriptions was done, including those for antibiotics for treatment of acute upper respiratory tract infections in ambulatory care in 2001 and the public reporting of its results in 2006 [<xref ref-type="bibr" rid="ref21">21</xref>]. Since 2009, to discourage the excessive use of antibiotics, the Health Insurance Review and Assessment Service of Korea (HIRA) [<xref ref-type="bibr" rid="ref22">22</xref>] has provided information on antibiotic usage rates for all hospitals across the nation to the public. The antibiotic usage rate is represented as the total number of antibiotic prescriptions over the total number of visits. We considered this usage rate as a hospital quality index, and based on these HIRA usage rates, we rank-ordered all 779 pediatric clinics in the sampled cities.</p>
                <fig id="figure1" position="float">
                    <label>Figure 1</label>
                    <caption>
                        <p>Geographic regions in South Korea associated with online health communities.</p>
                    </caption>
                    <graphic xlink:href="jmir_v16i2e29_fig1.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
            </sec>
            <sec>
                <title>Mining Online Health Communities</title>
                <p>To investigate the crowdsourced information for public health in South Korea, particularly on the quality of pediatric clinics, we focused on user-generated content from online communities hosted by Korean Web portals. Preliminary examination showed that online communities specializing in pediatrics served as places for parents to actively discuss (through questions and answers) the quality of pediatric clinics by sharing their thoughts, ideas, and experiences (ie, crowdsourcing). Naver [<xref ref-type="bibr" rid="ref23">23</xref>] is a leading Internet search portal in Korea with an average market share of 78% and Daum [<xref ref-type="bibr" rid="ref24">24</xref>] ranks second with an average market share of 15.22% in 2013 [<xref ref-type="bibr" rid="ref25">25</xref>], and together they maintain the largest online health communities for child-raising parents; therefore, we analyzed the contents of only the local online health communities hosted by Naver and Daum. Furthermore, these 2 sites maintain various online health communities by topic and by region across the nation, such as support groups for cancer patients and general parental care in each local region.</p>
                <p>In particular, we were interested in the frequencies at which hospital names appeared in discussions on these websites. To ensure that frequently mentioned hospitals were more likely to be recognized as providing high-quality care, we only considered users&#8217; responses to others&#8217; requests for hospital recommendations. A certain user response could denote positive or negative attitudes based on his/her experiences. Sometimes, however, these attitudes were neutral (ie, only hospital names were mentioned without sentimental attitudes) or ambiguous (ie, positive and negative attitudes coexisted). Based on our observation of approximately 18.45% of the sample (32,065/173,748), 92.03% (29,511/32,065) were identified as being positive or neutral in attitude. In this context, we regarded the frequency of hospital names appearing in positive and neutral mentions as a measure of crowdsourced information, representing parents&#8217; beliefs about the quality of local hospitals. In this study, we did not consider negative mentions about hospitals in measuring crowdsourced information because their occurrence rate was less than 7.97% (2554/32,065) and including them did not affect the results of hospital evaluations. To aggregate the user-generated content that might contribute to constructing geospecific crowdsourced information on this particular topic, we selected candidate online communities on the basis of the number of members and the numbers of threads and messages. The contents of online communities can be divided into 3 levels: threads, messages, and sentences. Threads often contain several messages, whereas messages are short, often composed of only a few sentences or sentence fragments. <xref ref-type="fig" rid="figure2">Figure 2</xref> is a snapshot of the hospital recommendation contents in an online community.</p>
                <p>
                    <xref ref-type="table" rid="table1">Table 1</xref> shows the statistics of the content of the selected online communities for parents on Naver and Daum. We obtained 32,422 threads and over 170,000 messages. Thus, there were an average of 5.36 pediatric hospital&#8211;related discussions per thread among all community members.</p>
                <p>To mine discussions on pediatric hospitals from the 2 major Web portals, we developed a text-mining tool tailored to handle the difficulties inherent to the Korean language and the characteristics of local online communities for parents, as shown in <xref ref-type="fig" rid="figure3">Figure 3</xref>.</p>
                <fig id="figure2" position="float">
                    <label>Figure 2</label>
                    <caption>
                        <p>An example of an online community and the data construction process.</p>
                    </caption>
                    <graphic xlink:href="jmir_v16i2e29_fig2.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
                <table-wrap position="float" id="table1">
                    <label>Table 1</label>
                    <caption>
                        <p>Characteristics of the data extracted from selected online communities hosted by Naver and Daum Web portals.</p>
                    </caption>
                    <table width="590" border="1" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                        <col width="132" />
                        <col width="133" />
                        <col width="133" />
                        <col width="133" />
                        <thead>
                            <tr valign="top">
                                <td>District</td>
                                <td>Threads, n</td>
                                <td>Messages, n</td>
                                <td>Messages per thread, mean</td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td>Seoul</td>
                                <td>10,832</td>
                                <td>54,392</td>
                                <td>5.02</td>
                            </tr>
                            <tr valign="top">
                                <td>Daegu</td>
                                <td>8072</td>
                                <td>47,419</td>
                                <td>5.87</td>
                            </tr>
                            <tr valign="top">
                                <td>Busan</td>
                                <td>5965</td>
                                <td>28,910</td>
                                <td>4.85</td>
                            </tr>
                            <tr valign="top">
                                <td>Daejeon</td>
                                <td>3952</td>
                                <td>22,475</td>
                                <td>5.69</td>
                            </tr>
                            <tr valign="top">
                                <td>Incheon</td>
                                <td>775</td>
                                <td>5184</td>
                                <td>6.69</td>
                            </tr>
                            <tr valign="top">
                                <td>Gwangju</td>
                                <td>2826</td>
                                <td>15,368</td>
                                <td>5.44</td>
                            </tr>
                            <tr valign="top">
                                <td>Total</td>
                                <td>32,422</td>
                                <td>173,748</td>
                                <td>5.36</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
                <fig id="figure3" position="float">
                    <label>Figure 3</label>
                    <caption>
                        <p>Text mining for hospital name extraction.</p>
                    </caption>
                    <graphic xlink:href="jmir_v16i2e29_fig3.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
            </sec>
            <sec>
                <title>Step 1: Focused Crawling</title>
                <p>The previously mentioned Web portals, Naver and Daum, operate various kinds of online communities by region and subject. For example, the Naver portal has approximately 2 million communities by region. We observed that each region included at least 1 parents&#8217; community that stood out from the others in membership, popularity, and vigorous use by its members. We selected these local online communities as our text-mining information sources. Each online community provided a search function that helped us identify Web pages with the keywords &#8220;pediatric&#8221; and &#8220;recommendation.&#8221; The Web pages from selected online communities of parents were crawled and stored in hypertext markup language (HTML) format.</p>
            </sec>
            <sec>
                <title>Step 2: Preprocessing</title>
                <p>We deleted HTML tags and nontextual information, such as images, JavaScript codes, and advertisements from the extracted files. For effective handling of HTML content, we used the Beautiful Soup library, designed in the Python programming language [<xref ref-type="bibr" rid="ref26">26</xref>]. In addition, we only selected candidate messages that recommended or in some way mentioned hospitals to others.</p>
            </sec>
            <sec>
                <title>Step 3: Dictionary-Based Hospital Name Extraction</title>
                <p>When people mention hospitals in a social context in Korean, they can use a range of hospital names, mostly expressed through acronyms or abbreviations. To counter this problem, we built a dictionary of hospital names covering the pediatric hospitals in the 6 South Korean metropolitan cities (ie, Seoul, Daegu, Busan, Daejeon, Gwangju, and Incheon) based on the HIRA website. In the hospital name thesaurus, each hospital name had 3 similar expressions on average. This dictionary was a value (expression) mapping table that added acronyms or abbreviations of every hospital name observed in user-written sentences in the online communities. Using this dictionary, our text-mining module performed a specially designed stepwise expression normalization procedure based on textual similarity computed by edit-distance [<xref ref-type="bibr" rid="ref27">27</xref>] between the synonyms in the dictionary and the expressions in the sentences. This was used to find canonical hospital names for use in raw hospital representations.</p>
            </sec>
            <sec>
                <title>Step 4: Sorting Hospitals</title>
                <p>After we extracted the canonical hospital names from messages, we calculated the hospital name frequency by district. After sorting the names in descending order of frequency, we could compare the ranked hospital information with the hospital quality rankings obtained from the HIRA, which were based on antibiotic usage rate.</p>
                <p>We assessed the accuracy of the hospital name extraction through human tagging of a random sample of 9450 (5.44%) of the total messages (n=173,748). We achieved a recall (the proportion of hospital names in the original text that were extracted correctly) of 73% and precision (the proportion of hospital names extracted that were correct) of 84%. We calculated the <italic>F</italic>
                    <sub>1</sub> score, the harmonic mean of precision and recall, as <italic>F</italic>
                    <sub>1</sub>=2&#215;(precision)&#215;(recall)/(precision+recall)=77.7%. Although accuracy measures of 80% to 90% are often achieved in named entity extraction in English, such high accuracy in informal texts written in Korean is rare because of various types of acronyms, numerous misspellings, and frequent incorrect spacing between words. Together with the fact that Korean is an agglutinative language, these factors act as bottlenecks for performance.</p>
            </sec>
            <sec>
                <title>Measuring the Congruence of Crowdsourced Data</title>
                <p>To measure the congruence of crowdsourced data with official government data, we first compared hospital ratings based on antibiotic prescriptions with hospital rankings based on crowdsourced information from online health communities. The congruence of crowdsourced data was then determined based on the conformity of both rankings. For this, we used the following 2 indexes: Kendall tau [<xref ref-type="bibr" rid="ref28">28</xref>] and Spearman rho rank correlation coefficients. Kendall tau is defined in Equation (1), and Spearman rho is calculated as the Pearson correlation coefficient based on ranks and average ranks, as in Equation (2); both equations are shown in <xref ref-type="fig" rid="figure4">Figure 4</xref>.</p>
                <p>Both Kendall tau and Spearman rho range from &#8211;1 to +1. A value of +1 means that the 2 rankings completely agree and a value of &#8211;1 means that the 2 rankings are completely contradictory. Thus, the larger the index value, the greater the correspondence between the objective hospital ranking and crowdsourced ranking, which implies that online users are developing correct crowdsourced information.</p>
                <fig id="figure4" position="float">
                    <label>Figure 4</label>
                    <caption>
                        <p>Definitions of Kendall tau and Spearman rho rank correlation coefficients.</p>
                    </caption>
                    <graphic xlink:href="jmir_v16i2e29_fig4.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
            </sec>
            <sec>
                <title>Geospecific Sociodemographic Information</title>
                <p>Considering that information exchanges within online health communities occur disparately and are bounded by geographic region, we can examine the demographic information in a given region to identify the particular sociodemographics that influence the congruence of crowdsourced data (ie, the degree of correspondence between government ratings of hospitals in the region and Internet rankings). We selected 6 variables for use in the analysis: birthrate by region, mean and standard deviation of educational attainment for married women, population density, number of pediatric clinics per geographic area, and mean number of doctors per pediatric clinic. On the basis of previous studies that found pregnant and first-time mothers actively search for online health information, we selected birthrate as an independent variable [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref29">29</xref>]. Gender and education have been found to affect online health searching; specifically, women and more educated individuals were found to conduct more online searches [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref30">30</xref>-<xref ref-type="bibr" rid="ref32">32</xref>]. Therefore, education of married women was selected as a variable. In addition, we chose 3 other variables for availability of pediatric clinics and possible variation of assessment of doctors. Educational attainment refers to the highest level of education that married women had completed and was categorized into no education, elementary school, middle school, high school, 2-year college, 4-year college, master&#8217;s degree, and PhD. These were then converted into values of 0, 6, 9, 12, 14, 16, 18, and 23 years of schooling, respectively, to calculate the mean and standard deviation for education. For population density, we divided the population of each region by its area. For the number of doctors per pediatric clinic, we divided the total number of pediatric doctors in the region by the total number of pediatric clinics. We also used another variable, availability, to describe the availability of medical services, which was computed by dividing the total number of pediatric clinics in the region by the total population of that region. Finally, birthrate refers to the average number of children per fertile woman. <xref ref-type="table" rid="table2">Tables 2</xref> and <xref ref-type="table" rid="table3">3</xref> describe the variables along with appropriate summary statistics and correlations between independent variables.</p>
                <p>For hospitals recommended within local online communities, grouping them by year could have led to difficulties in comparing rankings because of the limited number of observations per local area. Therefore, we aggregated the number of recommended hospitals in a given region between 2009 and 2012 to compile the rankings. For comparison, we also calculated the average rate of antibiotic prescriptions between 2009 and 2012 to determine the objective hospital ranking.</p>
                <p>For the population, area (km<sup>2</sup>) of a region, and birthrate data, we computed the means for the data provided in the Korean Statistical Information Service (KOSIS) [<xref ref-type="bibr" rid="ref33">33</xref>] for a given period and used them as sociodemographic variables. However, for educational attainment, we had access to 2010 data only, and thus used them as they were. As the number of hospitals and the number of doctors per clinic in each year were unknown, we used the information registered at the HIRA website for 2012. We present all the sources of data in <xref ref-type="table" rid="table4">Table 4</xref>.</p>
                <p>To analyze which sociodemographic features influenced the congruence of crowdsourced data, we ran an ordinary least squares (OLS) regression on the 29 regions, with rank correlation as the dependent variable and the aforementioned 6 sociodemographic characteristics as independent variables.</p>
                <table-wrap position="float" id="table2">
                    <label>Table 2</label>
                    <caption>
                        <p>Summary statistics of variables.</p>
                    </caption>
                    <table width="590" border="1" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                        <col width="83" />
                        <col width="226" />
                        <col width="52" />
                        <col width="43" />
                        <col width="52" />
                        <col width="48" />
                        <thead>
                            <tr valign="top">
                                <td>Variable</td>
                                <td>Description</td>
                                <td>Mean</td>
                                <td>SD</td>
                                <td>Min</td>
                                <td>Max</td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td>Birthrate</td>
                                <td>Birthrate (number of births per fertile woman)</td>
                                <td>1.048</td>
                                <td>0.100</td>
                                <td>0.855</td>
                                <td>1.261</td>
                            </tr>
                            <tr valign="top">
                                <td>Education mean</td>
                                <td>Average educational attainment of married women</td>
                                <td>12.390</td>
                                <td>0.833</td>
                                <td>11.340</td>
                                <td>14.858</td>
                            </tr>
                            <tr valign="top">
                                <td>Education SD</td>
                                <td>Standard deviation of educational attainment of married women</td>
                                <td>3.496</td>
                                <td>0.183</td>
                                <td>3.149</td>
                                <td>3.788</td>
                            </tr>
                            <tr valign="bottom">
                                <td>Population density</td>
                                <td>Population per area (km<sup>2</sup>)</td>
                                <td>0.016</td>
                                <td>0.007</td>
                                <td>0.003</td>
                                <td>0.029</td>
                            </tr>
                            <tr valign="top">
                                <td>Doctors per clinic</td>
                                <td>Number of doctors per pediatric clinic</td>
                                <td>1.641</td>
                                <td>0.396</td>
                                <td>1.167</td>
                                <td>2.889</td>
                            </tr>
                            <tr valign="top">
                                <td>Availability</td>
                                <td>Number of pediatric clinics per 1000 persons</td>
                                <td>0.060</td>
                                <td>0.010</td>
                                <td>0.033</td>
                                <td>0.080</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
                <table-wrap position="float" id="table3">
                    <label>Table 3</label>
                    <caption>
                        <p>Correlations between independent variables.</p>
                    </caption>
                    <table width="639" border="1" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                        <col width="73" />
                        <col width="42" />
                        <col width="26" />
                        <col width="37" />
                        <col width="27" />
                        <col width="35" />
                        <col width="28" />
                        <col width="40" />
                        <col width="28" />
                        <col width="34" />
                        <col width="29" />
                        <col width="39" />
                        <col width="17" />
                        <thead>
                            <tr valign="top">
                                <td>Pearson correlation</td>
                                <td colspan="2">Birthrate</td>
                                <td colspan="2">Education mean</td>
                                <td colspan="2">Education SD</td>
                                <td colspan="2">Population density</td>
                                <td colspan="2">Doctors per hospital</td>
                                <td colspan="2">Availability</td>
                            </tr>
                            <tr valign="top">
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <italic>r</italic>
                                </td>
                                <td>
                                    <italic>P</italic>
                                </td>
                                <td>
                                    <italic>r</italic>
                                </td>
                                <td>
                                    <italic>P</italic>
                                </td>
                                <td>
                                    <italic>r</italic>
                                </td>
                                <td>
                                    <italic>P</italic>
                                </td>
                                <td>
                                    <italic>r</italic>
                                </td>
                                <td>
                                    <italic>P</italic>
                                </td>
                                <td>
                                    <italic>r</italic>
                                </td>
                                <td>
                                    <italic>P</italic>
                                </td>
                                <td>
                                    <italic>r</italic>
                                </td>
                                <td>
                                    <italic>P</italic>
                                </td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td>Birthrate</td>
                                <td>1.00</td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                            </tr>
                            <tr valign="top">
                                <td>Education mean</td>
                                <td>&#8211;.27</td>
                                <td>.16</td>
                                <td>1.00</td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                            </tr>
                            <tr valign="top">
                                <td>Education SD</td>
                                <td>.03</td>
                                <td>.88</td>
                                <td>&#8211;.34</td>
                                <td>.07</td>
                                <td>1.00</td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                            </tr>
                            <tr valign="top">
                                <td>Population density</td>
                                <td>&#8211;.58</td>
                                <td>.001</td>
                                <td>.03</td>
                                <td>.89</td>
                                <td>&#8211;.10</td>
                                <td>.60</td>
                                <td>1.00</td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                            </tr>
                            <tr valign="top">
                                <td>Doctors per hospital</td>
                                <td>&#8211;.23</td>
                                <td>.24</td>
                                <td>.27</td>
                                <td>.15</td>
                                <td>.22</td>
                                <td>.24</td>
                                <td>&#8211;.06</td>
                                <td>.74</td>
                                <td>1.00</td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                            </tr>
                            <tr valign="top">
                                <td>Availability</td>
                                <td>.11</td>
                                <td>.57</td>
                                <td>.38</td>
                                <td>.04</td>
                                <td>.09</td>
                                <td>.66</td>
                                <td>&#8211;.15</td>
                                <td>.44</td>
                                <td>.26</td>
                                <td>.17</td>
                                <td>1.00</td>
                                <td>
                                    <break />
                                </td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
                <table-wrap position="float" id="table4">
                    <label>Table 4</label>
                    <caption>
                        <p>Data sources and time periods used.</p>
                    </caption>
                    <table width="544" border="1" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                        <col width="28" />
                        <col width="224" />
                        <col width="137" />
                        <col width="96" />
                        <thead>
                            <tr valign="top">
                                <td colspan="2">Information type and source</td>
                                <td>Data</td>
                                <td>Period</td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td colspan="2">
                                    <bold>Official government data</bold>
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                            </tr>
                            <tr valign="top">
                                <td>
                                    <break />
                                </td>
                                <td>Health Insurance Review &#38; Assessment Service (HIRA)</td>
                                <td>Antibiotic prescription rate</td>
                                <td>2009-2012 (Average)</td>
                            </tr>
                            <tr valign="top">
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td># of hospitals</td>
                                <td>2013</td>
                            </tr>
                            <tr valign="top">
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td># of doctors</td>
                                <td>2013</td>
                            </tr>
                            <tr valign="top">
                                <td colspan="2">
                                    <bold>Crowdsourced data from online communities</bold>
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                            </tr>
                            <tr valign="top">
                                <td>
                                    <break />
                                </td>
                                <td>Web portals (Daum, Naver)</td>
                                <td># of recommended hospitals</td>
                                <td>2009-2012 (Sum)</td>
                            </tr>
                            <tr valign="top">
                                <td colspan="2">
                                    <bold>Geospecific demographic information</bold>
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                            </tr>
                            <tr valign="top">
                                <td>
                                    <break />
                                </td>
                                <td>Korean Statistical Information Service (KOSIS)</td>
                                <td>Population</td>
                                <td>2009-2012 (Average)</td>
                            </tr>
                            <tr valign="top">
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td>Area of a region</td>
                                <td>2009-2012 (Average)</td>
                            </tr>
                            <tr valign="top">
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td>Birthrate</td>
                                <td>2009-2012 (Average)</td>
                            </tr>
                            <tr valign="top">
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td>Education</td>
                                <td>2010</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
            </sec>
        </sec>
        <sec sec-type="results">
            <title>Results</title>
            <sec>
                <title>Rank Correlations</title>
                <p>
                    <xref ref-type="table" rid="table5">Table 5</xref> shows the rank correlation coefficients by region for 29 of the 30 regions. We excluded Jongno-gu in Seoul because it had relatively few online communities.</p>
                <p>As seen in <xref ref-type="table" rid="table5">Table 5</xref>, significant variations in Kendall tau and Spearman rho scores exist across regions, with the lowest for region S7 and highest for region S8.</p>
                <table-wrap position="float" id="table5">
                    <label>Table 5</label>
                    <caption>
                        <p>Congruence of geospecific crowdsourced health information.</p>
                    </caption>
                    <table width="472" border="1" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                        <col width="59" />
                        <col width="46" />
                        <col width="98" />
                        <col width="43" />
                        <col width="94" />
                        <col width="46" />
                        <thead>
                            <tr valign="bottom">
                                <td>District<sup>a</sup>
                                </td>
                                <td>n<sup>b</sup>
                                </td>
                                <td>Kendall tau</td>
                                <td>Rank</td>
                                <td>Spearman rho</td>
                                <td>Rank</td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td>S1</td>
                                <td>14</td>
                                <td>0.132</td>
                                <td>11</td>
                                <td>0.152</td>
                                <td>11</td>
                            </tr>
                            <tr valign="top">
                                <td>S2</td>
                                <td>21</td>
                                <td>0.214</td>
                                <td>8</td>
                                <td>0.292</td>
                                <td>9</td>
                            </tr>
                            <tr valign="top">
                                <td>S3</td>
                                <td>11</td>
                                <td>0.255</td>
                                <td>7</td>
                                <td>0.330</td>
                                <td>7</td>
                            </tr>
                            <tr valign="top">
                                <td>S4</td>
                                <td>15</td>
                                <td>0.038</td>
                                <td>18</td>
                                <td>0.040</td>
                                <td>18</td>
                            </tr>
                            <tr valign="top">
                                <td>S5</td>
                                <td>15</td>
                                <td>0.438</td>
                                <td>2</td>
                                <td>0.587</td>
                                <td>2</td>
                            </tr>
                            <tr valign="top">
                                <td>S6</td>
                                <td>17</td>
                                <td>0.265</td>
                                <td>6</td>
                                <td>0.415</td>
                                <td>6</td>
                            </tr>
                            <tr valign="top">
                                <td>S7</td>
                                <td>11</td>
                                <td>&#8211;0.346</td>
                                <td>28</td>
                                <td>&#8211;0.466</td>
                                <td>28</td>
                            </tr>
                            <tr valign="top">
                                <td>S8</td>
                                <td>5</td>
                                <td>0.5</td>
                                <td>1</td>
                                <td>0.667</td>
                                <td>1</td>
                            </tr>
                            <tr valign="top">
                                <td>S9</td>
                                <td>22</td>
                                <td>0.052</td>
                                <td>15</td>
                                <td>0.093</td>
                                <td>12</td>
                            </tr>
                            <tr valign="top">
                                <td>S10</td>
                                <td>10</td>
                                <td>&#8211;0.089</td>
                                <td>23</td>
                                <td>&#8211;0.109</td>
                                <td>22</td>
                            </tr>
                            <tr valign="top">
                                <td>S11</td>
                                <td>11</td>
                                <td>0.382</td>
                                <td>3</td>
                                <td>0.441</td>
                                <td>5</td>
                            </tr>
                            <tr valign="top">
                                <td>S12</td>
                                <td>12</td>
                                <td>&#8211;0.182</td>
                                <td>25</td>
                                <td>&#8211;0.232</td>
                                <td>24</td>
                            </tr>
                            <tr valign="top">
                                <td>S13</td>
                                <td>15</td>
                                <td>0.210</td>
                                <td>9</td>
                                <td>0.321</td>
                                <td>8</td>
                            </tr>
                            <tr valign="top">
                                <td>S14</td>
                                <td>13</td>
                                <td>&#8211;0.077</td>
                                <td>22</td>
                                <td>&#8211;0.135</td>
                                <td>23</td>
                            </tr>
                            <tr valign="top">
                                <td>S15</td>
                                <td>11</td>
                                <td>0.327</td>
                                <td>5</td>
                                <td>0.471</td>
                                <td>3</td>
                            </tr>
                            <tr valign="top">
                                <td>S16</td>
                                <td>11</td>
                                <td>&#8211;0.236</td>
                                <td>27</td>
                                <td>&#8211;0.340</td>
                                <td>27</td>
                            </tr>
                            <tr valign="top">
                                <td>S17</td>
                                <td>10</td>
                                <td>&#8211;0.156</td>
                                <td>24</td>
                                <td>&#8211;0.268</td>
                                <td>25</td>
                            </tr>
                            <tr valign="top">
                                <td>S18</td>
                                <td>26</td>
                                <td>0.040</td>
                                <td>16</td>
                                <td>0.055</td>
                                <td>17</td>
                            </tr>
                            <tr valign="top">
                                <td>S19</td>
                                <td>18</td>
                                <td>&#8211;0.235</td>
                                <td>26</td>
                                <td>&#8211;0.326</td>
                                <td>26</td>
                            </tr>
                            <tr valign="top">
                                <td>S20</td>
                                <td>15</td>
                                <td>0.086</td>
                                <td>12</td>
                                <td>0.080</td>
                                <td>13</td>
                            </tr>
                            <tr valign="top">
                                <td>S21</td>
                                <td>8</td>
                                <td>&#8211;0.357</td>
                                <td>29</td>
                                <td>&#8211;0.470</td>
                                <td>29</td>
                            </tr>
                            <tr valign="top">
                                <td>S22</td>
                                <td>16</td>
                                <td>0.350</td>
                                <td>4</td>
                                <td>0.458</td>
                                <td>4</td>
                            </tr>
                            <tr valign="top">
                                <td>S24</td>
                                <td>3</td>
                                <td>0.000</td>
                                <td>20</td>
                                <td>0.000</td>
                                <td>20</td>
                            </tr>
                            <tr valign="top">
                                <td>S25</td>
                                <td>12</td>
                                <td>0.061</td>
                                <td>13</td>
                                <td>0.078</td>
                                <td>14</td>
                            </tr>
                            <tr valign="top">
                                <td>Gwangju</td>
                                <td>57</td>
                                <td>0.040</td>
                                <td>16</td>
                                <td>0.060</td>
                                <td>16</td>
                            </tr>
                            <tr valign="top">
                                <td>Daegu</td>
                                <td>99</td>
                                <td>0.180</td>
                                <td>10</td>
                                <td>0.268</td>
                                <td>10</td>
                            </tr>
                            <tr valign="top">
                                <td>Daejeon</td>
                                <td>53</td>
                                <td>0.025</td>
                                <td>19</td>
                                <td>0.040</td>
                                <td>18</td>
                            </tr>
                            <tr valign="top">
                                <td>Busan</td>
                                <td>155</td>
                                <td>0.056</td>
                                <td>14</td>
                                <td>0.078</td>
                                <td>14</td>
                            </tr>
                            <tr valign="top">
                                <td>Incheon</td>
                                <td>93</td>
                                <td>&#8211;0.006</td>
                                <td>21</td>
                                <td>&#8211;0.001</td>
                                <td>21</td>
                            </tr>
                            <tr valign="top">
                                <td>Total</td>
                                <td>779</td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                                <td>
                                    <break />
                                </td>
                            </tr>
                        </tbody>
                    </table>
                    <table-wrap-foot>
                        <fn id="table5fn1">
                            <p>
                                <sup>a</sup> S means Seoul and S1 represents district (gu) 1 of Seoul. S23 is Jongno-gu. Matched district names are listed in <xref ref-type="fig" rid="figure2">Figure 2</xref>.</p>
                        </fn>
                        <fn id="table5fn2">
                            <p>
                                <sup>b</sup> Number of pediatric clinics that were mentioned in online communities.</p>
                        </fn>
                    </table-wrap-foot>
                </table-wrap>
            </sec>
            <sec>
                <title>Ordinary Least Squares Regression Results</title>
                <p>
                    <xref ref-type="table" rid="table6">Table 6</xref> shows the OLS regression results that we obtained (adjusted <italic>R</italic>
                    <sup>
                        <italic>2</italic>
                    </sup>=.334). All independent variables, except availability, had negative coefficient values. Birthrate significantly lowered the congruence of crowdsourced data with official government data at the 1% level, whereas the standard deviation of educational attainment, population density, and number of doctors per clinic negatively affected congruence at a significance level of 5%. However, the variables of average educational attainment and availability (number of hospitals per 1000 people) were not statistically significant. In terms of each independent variable, our study showed that the crowdsourced data within online communities in a given region was likely to be less congruent when the region had a higher birthrate, a larger standard deviation of educational attainment, a higher population density, or a greater number of doctors per clinic. We observed similar findings when we used the Spearman rho rank correlation coefficient instead of Kendall tau for ranking comparisons in the OLS regression analysis (adjusted <italic>R</italic>
                    <sup>
                        <italic>2</italic>
                    </sup>=.364).</p>
                <table-wrap position="float" id="table6">
                    <label>Table 6</label>
                    <caption>
                        <p>Parameter estimates and standard errors.</p>
                    </caption>
                    <table width="623" border="1" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                        <col width="109" />
                        <col width="63" />
                        <col width="46" />
                        <col width="49" />
                        <col width="79" />
                        <col width="72" />
                        <col width="44" />
                        <col width="47" />
                        <thead>
                            <tr valign="bottom">
                                <td>Independent variable</td>
                                <td colspan="3">Kendall tau</td>
                                <td>Standardized coefficient<sup>a</sup>
                                </td>
                                <td colspan="3">Spearman rho</td>
                            </tr>
                            <tr valign="top">
                                <td>
                                    <break />
                                </td>
                                <td>Coefficient</td>
                                <td>SE</td>
                                <td>
                                    <italic>P</italic> value</td>
                                <td>
                                    <break />
                                </td>
                                <td>Coefficient</td>
                                <td>SE</td>
                                <td>
                                    <italic>P</italic> value</td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td>Birthrate</td>
                                <td>&#8211;1.678</td>
                                <td>0.477</td>
                                <td>.002</td>
                                <td>&#8211;0.748</td>
                                <td>&#8211;2.302</td>
                                <td>0.633</td>
                                <td>.001</td>
                            </tr>
                            <tr valign="top">
                                <td>Education mean</td>
                                <td>&#8211;0.091</td>
                                <td>0.055</td>
                                <td>.12</td>
                                <td>&#8211;0.335</td>
                                <td>&#8211;0.117</td>
                                <td>0.073</td>
                                <td>.12</td>
                            </tr>
                            <tr valign="top">
                                <td>Education SD</td>
                                <td>&#8211;0.471</td>
                                <td>0.223</td>
                                <td>.046</td>
                                <td>&#8211;0.382</td>
                                <td>&#8211;0.636</td>
                                <td>0.296</td>
                                <td>.04</td>
                            </tr>
                            <tr valign="top">
                                <td>Population density</td>
                                <td>&#8211;16.860</td>
                                <td>6.244</td>
                                <td>.01</td>
                                <td>&#8211;0.532</td>
                                <td>&#8211;24.077</td>
                                <td>8.282</td>
                                <td>.008</td>
                            </tr>
                            <tr valign="top">
                                <td>Doctors per clinic</td>
                                <td>&#8211;0.212</td>
                                <td>0.101</td>
                                <td>.048</td>
                                <td>&#8211;0.373</td>
                                <td>&#8211;0.311</td>
                                <td>0.134</td>
                                <td>.03</td>
                            </tr>
                            <tr valign="top">
                                <td>Availability</td>
                                <td>2.611</td>
                                <td>4.077</td>
                                <td>.53</td>
                                <td>0.116</td>
                                <td>3.797</td>
                                <td>5.407</td>
                                <td>.49</td>
                            </tr>
                            <tr valign="top">
                                <td>Constant</td>
                                <td>5.051</td>
                                <td>1.407</td>
                                <td>.002</td>
                                <td>
                                    <break />
                                </td>
                                <td>6.837</td>
                                <td>1.866</td>
                                <td>.001</td>
                            </tr>
                        </tbody>
                    </table>
                    <table-wrap-foot>
                        <fn id="table6fn1">
                            <p>
                                <sup>a</sup> Standardized coefficients are the regression coefficients obtained by first standardizing all variables to have a mean of 0 and a standard deviation of 1.</p>
                        </fn>
                    </table-wrap-foot>
                </table-wrap>
                <p>We also standardized the coefficients to better compare the impact of the variables. Among the statistically significant variables, birthrate had the largest standardized coefficient in absolute value, whereas doctors per clinic had the smallest. The standardized coefficients can be interpreted directly; for example, a 1 SD decrease in birthrate led to a 0.75 SD increase in predicted Kendall tau, with the other variables held constant. Similarly, a 1 SD decrease in doctors per clinic yielded a 0.37 SD increase in the predicted Kendall tau. These results, presented in <xref ref-type="table" rid="table6">Table 6</xref>, can explain the variations in Kendall tau values across districts that we observed in <xref ref-type="table" rid="table5">Table 5</xref>.</p>
                <p>For illustration purposes, we compared 2 districts in Seoul: S5 (with a relatively high Kendall tau of 0.44) and S18 (with a low Kendall tau of 0.04). Large differences in demographic characteristics between S5 and S18 in birthrate (0.897 vs 1.042) and doctors per clinic (1.185 vs 1.808) explained why S5 had a higher Kendall tau value. Similarly, we could explain the difference in congruence of crowdsourced data between the local cities. For instance, a higher Kendall tau value for Daegu in comparison to that for Daejeon was associated with Daegu&#8217;s lower birthrate, standard deviation of educational attainment, and number of doctors per clinic.</p>
                <p>A higher birthrate in a region implies that there is a greater percentage of women with children under age 2 years who have relatively less experience with pediatric clinics. As a result, the proportion of women seeking and sharing information on pediatric hospitals in online communities may be greater for regions with higher birthrates compared with other regions. This can explain why the congruence of crowdsourced data is likely to be lower in a region with higher birthrates. Interestingly, our findings also showed that the average educational attainment of married women in a region was not significantly related to the level of congruence; however, this was not the case for the standard deviation of educational attainment, which had a significant negative relationship with the congruence of crowdsourced data. This difference may be because of the potential mingling of correct and misleading information in the exchange of hospital information in online communities, where users do not have any knowledge of the educational attainment of other users. It is also likely that more densely populated regions have a greater number of people gathering pediatric hospital information through offline channels (eg, nearby friends or relatives) than through online communities. In other words, crowdsourced information is created from face-to-face interactions&#8212;an offline channel&#8212;meaning that there is no definitive build-up of online crowdsourcing in this case. Finally, the greater the number of doctors per clinic, the higher the chance that people build up less congruent crowdsourced information on these hospitals. This can be explained by the notion that people often judge the same hospital differently according to the doctor they visit; thus, there would be greater variation in users&#8217; evaluations of a hospital with a large number of doctors as opposed to a smaller number.</p>
            </sec>
        </sec>
        <sec sec-type="discussion">
            <title>Discussion</title>
            <p>Although patients actively create and exchange health information in this era of Health 2.0, the spread of inaccurate health information can have a potentially negative effect on public health because of its direct impact on patients&#8217; health conditions. Hence, in this study, we investigated the congruence between crowdsourced information and official government data in the health care domain and geospecific determinants of misinformation across South Korea. In particular, this is the first attempt in the literature to associate the results of data mining from geospecific online health communities with sociodemographic characteristics of regions.</p>
            <p>We found that the quality of crowdsourced information on health care services varies across regions and that these variations can be explained by geospecific demographic factors, such as birthrate, educational attainment, population density, and the number of doctors per clinic. The findings of our study hold practical implications for health policies. From our research, we suggest that government authorities should recognize the power of crowdsourcing and make efforts to reduce the potential risk of low-quality health information and the accompanying safety issues. Crowdsourcing for health care services, unlike that for general products and services, is based on contributions from nonspecialists. Furthermore, the quality of crowdsourced information can be lower for pediatric clinics in particular because parents serve as agents for their children, who can seldom self-diagnose the various symptoms they are suffering. Therefore, our findings also suggest the need for governmental efforts to counterbalance the misinformation by disseminating approval ratings of pediatric clinics via geospecific online health communities, and that this can be accomplished by prioritizing the regions with the lowest information quality levels.</p>
            <p>This study also had some limitations. Although we collected data on major online communities with many active users by region, we did not fully evaluate all hospitals in each region. However, as we confined our focus to online communities on pediatrics with a relatively large number of users&#8212;consisting of typical mothers of young children&#8212;we can say that the hospital list by region extracted using text-mining techniques was quite reliable in practice. In addition, although the text mining showed reasonable performance in the Korean language, performance could be enhanced through anaphora resolution of hospital names. It should be noted that the context of an Internet forum is disorganized and the language used tends to follow the idiosyncratic nature of human beings rather than grammatical standards and rules. Therefore, in our future research, we plan to extend the application of the text-mining tool to sentiment analysis and the specific textual relationships between qualitative factors that influence people&#8217;s choice of hospitals. In that way, we hope we can draw more practical implications for health policies.</p>
        </sec>
    </body>
    <back>
        <glossary>
            <title>Abbreviations</title>
            <def-list>
                <def-item>
                    <term id="abb1">HIRA</term>
                    <def>
                        <p>Health Insurance Review and Assessment</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb2">HTML</term>
                    <def>
                        <p>hypertext markup language</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb3">KOSIS</term>
                    <def>
                        <p>Korean Statistical Information Service</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb4">OLS</term>
                    <def>
                        <p>ordinary least squares</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb5">SARS</term>
                    <def>
                        <p>severe acute respiratory syndrome</p>
                    </def>
                </def-item>
            </def-list>
        </glossary>
        <fn-group>
            <fn fn-type="conflict">
                <p>None declared.</p>
            </fn>
        </fn-group>
        <ref-list>
            <ref id="ref1">
                <label>1</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>O'Reilly</surname>
                            <given-names>T</given-names>
                        </name>
                    </person-group>
                    <source>O&#039;Reilly Media Inc</source>
                    <year>2005</year>
                    <access-date>2014-01-19</access-date>
                    <comment>What is Web 2.0: design patterns and business models for the next generation of software<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://oreilly.com/web2/archive/what-is-web-20.html">http://oreilly.com/web2/archive/what-is-web-20.html</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6MiXNbMo1</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref2">
                <label>2</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Eysenbach</surname>
                            <given-names>G</given-names>
                        </name>
                    </person-group>
                    <article-title>Consumer health informatics</article-title>
                    <source>BMJ</source>
                    <year>2000</year>
                    <month>06</month>
                    <day>24</day>
                    <volume>320</volume>
                    <issue>7251</issue>
                    <fpage>1713</fpage>
                    <lpage>6</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/10864552" />
                    </comment>
                    <pub-id pub-id-type="medline">10864552</pub-id>
                    <pub-id pub-id-type="pmcid">PMC1127483</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref3">
                <label>3</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Wicks</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Massagli</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Frost</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Brownstein</surname>
                            <given-names>C</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Okun</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Vaughan</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Bradley</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Heywood</surname>
                            <given-names>J</given-names>
                        </name>
                    </person-group>
                    <article-title>Sharing health data for better outcomes on PatientsLikeMe</article-title>
                    <source>J Med Internet Res</source>
                    <year>2010</year>
                    <volume>12</volume>
                    <issue>2</issue>
                    <fpage>e19</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2010/2/e19/" />
                    </comment>
                    <pub-id pub-id-type="doi">10.2196/jmir.1549</pub-id>
                    <pub-id pub-id-type="medline">20542858</pub-id>
                    <pub-id pub-id-type="pii">v12i2e19</pub-id>
                    <pub-id pub-id-type="pmcid">PMC2956230</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref4">
                <label>4</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Hawn</surname>
                            <given-names>C</given-names>
                        </name>
                    </person-group>
                    <article-title>Take two aspirin and tweet me in the morning: how Twitter, Facebook, and other social media are reshaping health care</article-title>
                    <source>Health Aff (Millwood)</source>
                    <year>2009</year>
                    <month>03</month>
                    <volume>28</volume>
                    <issue>2</issue>
                    <fpage>361</fpage>
                    <lpage>8</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://content.healthaffairs.org/cgi/pmidlookup?view=long&#38;pmid=19275991" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1377/hlthaff.28.2.361</pub-id>
                    <pub-id pub-id-type="medline">19275991</pub-id>
                    <pub-id pub-id-type="pii">28/2/361</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref5">
                <label>5</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Gao</surname>
                            <given-names>GG</given-names>
                        </name>
                        <name name-style="western">
                            <surname>McCullough</surname>
                            <given-names>JS</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Agarwal</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Jha</surname>
                            <given-names>AK</given-names>
                        </name>
                    </person-group>
                    <article-title>A changing landscape of physician quality reporting: analysis of patients' online ratings of their physicians over a 5-year period</article-title>
                    <source>J Med Internet Res</source>
                    <year>2012</year>
                    <month>02</month>
                    <volume>14</volume>
                    <issue>1</issue>
                    <fpage>e38</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2012/1/e38/" />
                    </comment>
                    <pub-id pub-id-type="doi">10.2196/jmir.2003</pub-id>
                    <pub-id pub-id-type="medline">22366336</pub-id>
                    <pub-id pub-id-type="pii">v14i1e38</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3374528</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref6">
                <label>6</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Popoiu</surname>
                            <given-names>MC</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Grosseck</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Holotescu</surname>
                            <given-names>C</given-names>
                        </name>
                    </person-group>
                    <article-title>What do we know about the use of social media in medical education?</article-title>
                    <source>Procedia - Social and Behavioral Sciences</source>
                    <year>2012</year>
                    <month>01</month>
                    <conf-name>4th World Conference on Educational Sciences (WCES-2012)</conf-name>
                    <conf-date>02-05 February 2012</conf-date>
                    <conf-loc>Barcelona, Spain</conf-loc>
                    <fpage>2262</fpage>
                    <lpage>2266</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.sbspro.2012.05.466</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref7">
                <label>7</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Eysenbach</surname>
                            <given-names>G</given-names>
                        </name>
                    </person-group>
                    <article-title>Infodemiology: the epidemiology of (mis)information</article-title>
                    <source>The American Journal of Medicine</source>
                    <year>2002</year>
                    <month>12</month>
                    <day>15</day>
                    <volume>113</volume>
                    <issue>9</issue>
                    <fpage>763</fpage>
                    <lpage>765</lpage>
                    <pub-id pub-id-type="doi">10.1016/S0002-9343(02)01473-0</pub-id>
                    <pub-id pub-id-type="medline">12517369</pub-id>
                    <pub-id pub-id-type="pii">S0002934302014730</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref8">
                <label>8</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Eysenbach</surname>
                            <given-names>G</given-names>
                        </name>
                    </person-group>
                    <article-title>Infodemiology and infoveillance: framework for an emerging set of public health informatics methods to analyze search, communication and publication behavior on the Internet</article-title>
                    <source>J Med Internet Res</source>
                    <year>2009</year>
                    <month>03</month>
                    <volume>11</volume>
                    <issue>1</issue>
                    <fpage>e11</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2009/1/e11/" />
                    </comment>
                    <pub-id pub-id-type="doi">10.2196/jmir.1157</pub-id>
                    <pub-id pub-id-type="medline">19329408</pub-id>
                    <pub-id pub-id-type="pii">v11i1e11</pub-id>
                    <pub-id pub-id-type="pmcid">PMC2762766</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref9">
                <label>9</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Marcus</surname>
                            <given-names>MA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Westra</surname>
                            <given-names>HA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Eastwood</surname>
                            <given-names>JD</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Barnes</surname>
                            <given-names>KL</given-names>
                        </name>
                        <collab>Mobilizing Minds Research Group</collab>
                    </person-group>
                    <article-title>What are young adults saying about mental health? An analysis of Internet blogs</article-title>
                    <source>J Med Internet Res</source>
                    <year>2012</year>
                    <month>01</month>
                    <volume>14</volume>
                    <issue>1</issue>
                    <fpage>e17</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2012/1/e17/" />
                    </comment>
                    <pub-id pub-id-type="doi">10.2196/jmir.1868</pub-id>
                    <pub-id pub-id-type="medline">22569642</pub-id>
                    <pub-id pub-id-type="pii">v14i1e17</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3374526</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref10">
                <label>10</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Greaves</surname>
                            <given-names>F</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ramirez-Cano</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Millett</surname>
                            <given-names>C</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Darzi</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Donaldson</surname>
                            <given-names>L</given-names>
                        </name>
                    </person-group>
                    <article-title>Use of sentiment analysis for capturing patient experience from free-text comments posted online</article-title>
                    <source>J Med Internet Res</source>
                    <year>2013</year>
                    <volume>15</volume>
                    <issue>11</issue>
                    <fpage>e239</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2013/11/e239/" />
                    </comment>
                    <pub-id pub-id-type="doi">10.2196/jmir.2721</pub-id>
                    <pub-id pub-id-type="medline">24184993</pub-id>
                    <pub-id pub-id-type="pii">v15i11e239</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3841376</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref11">
                <label>11</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Eysenbach</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Powell</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kuss</surname>
                            <given-names>O</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sa</surname>
                            <given-names>E</given-names>
                        </name>
                    </person-group>
                    <article-title>Empirical Studies Assessing the Quality of Health Information for Consumers on the World Wide Web</article-title>
                    <source>JAMA</source>
                    <year>2002</year>
                    <month>05</month>
                    <day>22</day>
                    <volume>287</volume>
                    <issue>20</issue>
                    <fpage>2691</fpage>
                    <lpage>700</lpage>
                    <pub-id pub-id-type="doi">10.1001/jama.287.20.2691</pub-id>
                    <pub-id pub-id-type="medline">12020305</pub-id>
                    <pub-id pub-id-type="pii">jrv10005</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref12">
                <label>12</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Morahan-Martin</surname>
                            <given-names>JM</given-names>
                        </name>
                    </person-group>
                    <article-title>How internet users find, evaluate, and use online health information: a cross-cultural review</article-title>
                    <source>Cyberpsychol Behav</source>
                    <year>2004</year>
                    <month>10</month>
                    <volume>7</volume>
                    <issue>5</issue>
                    <fpage>497</fpage>
                    <lpage>510</lpage>
                    <pub-id pub-id-type="medline">15667044</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref13">
                <label>13</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Skinner</surname>
                            <given-names>H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Biscope</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Poland</surname>
                            <given-names>B</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Goldberg</surname>
                            <given-names>E</given-names>
                        </name>
                    </person-group>
                    <article-title>How adolescents use technology for health information: implications for health professionals from focus group studies</article-title>
                    <source>J Med Internet Res</source>
                    <year>2003</year>
                    <month>12</month>
                    <day>18</day>
                    <volume>5</volume>
                    <issue>4</issue>
                    <fpage>e32</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2003/4/e32/" />
                    </comment>
                    <pub-id pub-id-type="doi">10.2196/jmir.5.4.e32</pub-id>
                    <pub-id pub-id-type="medline">14713660</pub-id>
                    <pub-id pub-id-type="pmcid">PMC1550577</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref14">
                <label>14</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Tsai</surname>
                            <given-names>CC</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Tsai</surname>
                            <given-names>SH</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Zeng-Treitler</surname>
                            <given-names>Q</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Liang</surname>
                            <given-names>BA</given-names>
                        </name>
                    </person-group>
                    <article-title>Patient-centered consumer health social network websites: a pilot study of quality of user-generated health information</article-title>
                    <source>AMIA Annu Symp Proc</source>
                    <year>2007</year>
                    <month>10</month>
                    <conf-name>Proceedings of the Annual Symposium of the American Medical Informatics Association</conf-name>
                    <conf-date>2007</conf-date>
                    <conf-loc>Chicago, IL</conf-loc>
                    <fpage>1137</fpage>
                </nlm-citation>
            </ref>
            <ref id="ref15">
                <label>15</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Clauson</surname>
                            <given-names>KA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Polen</surname>
                            <given-names>HH</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Boulos</surname>
                            <given-names>MN</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Dzenowagis</surname>
                            <given-names>JH</given-names>
                        </name>
                    </person-group>
                    <article-title>Scope, completeness, and accuracy of drug information in Wikipedia</article-title>
                    <source>Ann Pharmacother</source>
                    <year>2008</year>
                    <month>12</month>
                    <volume>42</volume>
                    <issue>12</issue>
                    <fpage>1814</fpage>
                    <lpage>21</lpage>
                    <pub-id pub-id-type="doi">10.1345/aph.1L474</pub-id>
                    <pub-id pub-id-type="medline">19017825</pub-id>
                    <pub-id pub-id-type="pii">aph.1L474</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref16">
                <label>16</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Plantin</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Daneback</surname>
                            <given-names>K</given-names>
                        </name>
                    </person-group>
                    <article-title>Parenthood, information and support on the internet. A literature review of research on parents and professionals online</article-title>
                    <source>BMC Fam Pract</source>
                    <year>2009</year>
                    <volume>10</volume>
                    <fpage>34</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.biomedcentral.com/1471-2296/10/34" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1186/1471-2296-10-34</pub-id>
                    <pub-id pub-id-type="medline">19450251</pub-id>
                    <pub-id pub-id-type="pii">1471-2296-10-34</pub-id>
                    <pub-id pub-id-type="pmcid">PMC2694765</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref17">
                <label>17</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Stern</surname>
                            <given-names>MJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Cotten</surname>
                            <given-names>SR</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Drentea</surname>
                            <given-names>P</given-names>
                        </name>
                    </person-group>
                    <article-title>The separate spheres of online health: gender, parenting, and online health information searching in the information age</article-title>
                    <source>Journal of Family Issues</source>
                    <year>2011</year>
                    <month>10</month>
                    <day>21</day>
                    <volume>33</volume>
                    <issue>10</issue>
                    <fpage>1324</fpage>
                    <lpage>1350</lpage>
                    <pub-id pub-id-type="doi">10.1177/0192513X11425459</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref18">
                <label>18</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Weissman</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Besser</surname>
                            <given-names>RE</given-names>
                        </name>
                    </person-group>
                    <article-title>Promoting appropriate antibiotic use for pediatric patients: a social ecological framework</article-title>
                    <source>Semin Pediatr Infect Dis</source>
                    <year>2004</year>
                    <month>01</month>
                    <volume>15</volume>
                    <issue>1</issue>
                    <fpage>41</fpage>
                    <lpage>51</lpage>
                    <pub-id pub-id-type="medline">15175994</pub-id>
                    <pub-id pub-id-type="pii">S1045187004000056</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref19">
                <label>19</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Paluck</surname>
                            <given-names>E</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Katzenstein</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Frankish</surname>
                            <given-names>CJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Herbert</surname>
                            <given-names>CP</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Milner</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Speert</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Chambers</surname>
                            <given-names>K</given-names>
                        </name>
                    </person-group>
                    <article-title>Prescribing practices and attitudes toward giving children antibiotics</article-title>
                    <source>Can Fam Physician</source>
                    <year>2001</year>
                    <month>03</month>
                    <volume>47</volume>
                    <fpage>521</fpage>
                    <lpage>7</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.cfp.ca/cgi/pmidlookup?view=long&#38;pmid=11281085" />
                    </comment>
                    <pub-id pub-id-type="medline">11281085</pub-id>
                    <pub-id pub-id-type="pmcid">PMC2018393</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref20">
                <label>20</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Mainous</surname>
                            <given-names>AG</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hueston</surname>
                            <given-names>WJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Love</surname>
                            <given-names>MM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Evans</surname>
                            <given-names>ME</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Finger</surname>
                            <given-names>R</given-names>
                        </name>
                    </person-group>
                    <article-title>An evaluation of statewide strategies to reduce antibiotic overuse</article-title>
                    <source>Fam Med</source>
                    <year>2000</year>
                    <month>01</month>
                    <volume>32</volume>
                    <issue>1</issue>
                    <fpage>22</fpage>
                    <lpage>9</lpage>
                    <pub-id pub-id-type="medline">10645510</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref21">
                <label>21</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Kim</surname>
                            <given-names>B</given-names>
                        </name>
                    </person-group>
                    <article-title>Overview of antibiotic use in Korea</article-title>
                    <source>Infect Chemother</source>
                    <year>2012</year>
                    <volume>44</volume>
                    <issue>4</issue>
                    <fpage>250</fpage>
                    <pub-id pub-id-type="doi">10.3947/ic.2012.44.4.250</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref22">
                <label>22</label>
                <nlm-citation citation-type="web">
                    <source>Health Insurance Review and Assessment Service</source>
                    <access-date>2013-10-28</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.hira.or.kr/">http://www.hira.or.kr/</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6Ki5geHrV</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref23">
                <label>23</label>
                <nlm-citation citation-type="web">
                    <source>NAVER Corp</source>
                    <access-date>2013-10-28</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.naver.com/">http://www.naver.com/</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6Ki54BAEM</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref24">
                <label>24</label>
                <nlm-citation citation-type="web">
                    <source>Daum Communications</source>
                    <access-date>2013-10-28</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.daum.net/">http://www.daum.net/</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6Ki7w7xVe</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref25">
                <label>25</label>
                <nlm-citation citation-type="web">
                    <source>Internet Trend</source>
                    <access-date>2013-10-28</access-date>
                    <comment>Search engine market share <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.internettrend.co.kr/trendForward.tsp">http://www.internettrend.co.kr/trendForward.tsp</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6Ki6hA4Km</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref26">
                <label>26</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Richardson</surname>
                            <given-names>L</given-names>
                        </name>
                    </person-group>
                    <source>Beautiful Soup</source>
                    <access-date>2013-10-28</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.crummy.com/software/BeautifulSoup/">http://www.crummy.com/software/BeautifulSoup/</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6Ki6tNAXD</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref27">
                <label>27</label>
                <nlm-citation citation-type="book">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Vilares</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ribadas</surname>
                            <given-names>FJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Vilares</surname>
                            <given-names>J</given-names>
                        </name>
                    </person-group>
                    <article-title>Phrase similarity through the edit distance</article-title>
                    <source>Database and Expert Systems Applications</source>
                    <year>2004</year>
                    <publisher-loc>Berlin</publisher-loc>
                    <publisher-name>Springer</publisher-name>
                    <fpage>306</fpage>
                    <lpage>317</lpage>
                </nlm-citation>
            </ref>
            <ref id="ref28">
                <label>28</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Kendall</surname>
                            <given-names>MG</given-names>
                        </name>
                    </person-group>
                    <article-title>A new measure of rank correlation</article-title>
                    <source>Biometrika</source>
                    <year>1938</year>
                    <month>06</month>
                    <volume>30</volume>
                    <issue>1/2</issue>
                    <fpage>81</fpage>
                    <lpage>93</lpage>
                </nlm-citation>
            </ref>
            <ref id="ref29">
                <label>29</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Daneback</surname>
                            <given-names>K</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Plantin</surname>
                            <given-names>L</given-names>
                        </name>
                    </person-group>
                    <article-title>Research on parenthood and the internet: themes and trends</article-title>
                    <source>Cyberpsychology: Journal of Psychosocial Research on Cyberspace</source>
                    <year>2008</year>
                    <volume>2</volume>
                    <issue>2</issue>
                    <fpage>article2</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://cyberpsychology.eu/view.php?cisloclanku=2008110701&#38;article=2" />
                    </comment>
                </nlm-citation>
            </ref>
            <ref id="ref30">
                <label>30</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Rice</surname>
                            <given-names>RE</given-names>
                        </name>
                    </person-group>
                    <article-title>Influences, usage, and outcomes of Internet health information searching: multivariate results from the Pew surveys</article-title>
                    <source>Int J Med Inform</source>
                    <year>2006</year>
                    <month>01</month>
                    <volume>75</volume>
                    <issue>1</issue>
                    <fpage>8</fpage>
                    <lpage>28</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2005.07.032</pub-id>
                    <pub-id pub-id-type="medline">16125453</pub-id>
                    <pub-id pub-id-type="pii">S1386-5056(05)00146-2</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref31">
                <label>31</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Cotten</surname>
                            <given-names>SR</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Gupta</surname>
                            <given-names>SS</given-names>
                        </name>
                    </person-group>
                    <article-title>Characteristics of online and offline health information seekers and factors that discriminate between them</article-title>
                    <source>Soc Sci Med</source>
                    <year>2004</year>
                    <month>11</month>
                    <volume>59</volume>
                    <issue>9</issue>
                    <fpage>1795</fpage>
                    <lpage>1806</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.socscimed.2004.02.020</pub-id>
                    <pub-id pub-id-type="medline">15312915</pub-id>
                    <pub-id pub-id-type="pii">S0277953604000796</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref32">
                <label>32</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Hale</surname>
                            <given-names>TM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Cotten</surname>
                            <given-names>SR</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Drentea</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Goldner</surname>
                            <given-names>M</given-names>
                        </name>
                    </person-group>
                    <article-title>Rural-urban differences in general and health-related internet use</article-title>
                    <source>American Behavioral Scientist</source>
                    <year>2010</year>
                    <month>03</month>
                    <day>09</day>
                    <volume>53</volume>
                    <issue>9</issue>
                    <fpage>1304</fpage>
                    <lpage>1325</lpage>
                    <pub-id pub-id-type="doi">10.1177/0002764210361685</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref33">
                <label>33</label>
                <nlm-citation citation-type="web">
                    <source>Statistics Korea</source>
                    <access-date>2013-10-28</access-date>
                    <comment>Korean statistical information service <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://kosis.kr/">http://kosis.kr/</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6Ki7kxFCu</pub-id>
                </nlm-citation>
            </ref>
        </ref-list>
    </back>
</article>