<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
    <front>
        <journal-meta>
            <journal-id journal-id-type="publisher-id">JMIR</journal-id>
            <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
            <journal-title>Journal of Medical Internet Research</journal-title>
            <issn pub-type="epub">1438-8871</issn>
            <publisher>
                <publisher-name>Gunther Eysenbach</publisher-name>
                <publisher-loc>JMIR Publications Inc., Toronto, Canada</publisher-loc>
            </publisher>
        </journal-meta>
        <article-meta>
            <article-id pub-id-type="publisher-id">v14i1e22</article-id>
            <article-id pub-id-type="pmid">22356723</article-id>
            <article-id pub-id-type="doi">10.2196/jmir.1985</article-id>
            <article-categories>
                <subj-group subj-group-type="article-type">
                    <subject>Original Paper</subject>
                </subj-group>
            </article-categories>
            <title-group>
                <article-title>HealthTrust: A Social Network Approach for Retrieving Online Health Videos</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="editor">
                    <name>
                        <surname>Eysenbach</surname>
                        <given-names>Gunther</given-names>
                    </name>
                </contrib>
            </contrib-group>
            <contrib-group>
                <contrib contrib-type="reviewer">
                    <name>
                        <surname>Denecke</surname>
                        <given-names>Kerstin</given-names>
                    </name>
                </contrib>
                <contrib contrib-type="reviewer">
                    <name>
                        <surname>Lau</surname>
                        <given-names>Annie</given-names>
                    </name>
                </contrib>
            </contrib-group>
            <contrib-group>
                <contrib contrib-type="author" id="contrib1" corresp="yes">
                    <name name-style="western">
                        <surname>Fernandez-Luque</surname>
                        <given-names>Luis</given-names>
                    </name>
                    <degrees>MSc</degrees>
                    <xref ref-type="aff" rid="aff1">1</xref>
                    <address>
                        <institution>Northern Research Institute</institution>
                        <addr-line>Postboks 6434 Forskningsparken</addr-line>
                        <addr-line>Tromsø, 9294</addr-line>
                        <country>Norway</country>
                        <phone>47 93421287</phone>
                        <fax>47 77629401</fax>
                        <email>luis.luque@norut.no</email>
                    </address>
                    <xref ref-type="aff" rid="aff2">2</xref>
                </contrib>
                <contrib contrib-type="author" id="contrib2">
                    <name name-style="western">
                        <surname>Karlsen</surname>
                        <given-names>Randi</given-names>
                    </name>
                    <degrees>PhD</degrees>
                    <xref ref-type="aff" rid="aff1">1</xref>
                    <xref ref-type="aff" rid="aff2">2</xref>
                </contrib>
                <contrib contrib-type="author" id="contrib3">
                    <name name-style="western">
                        <surname>Melton</surname>
                        <given-names>Genevieve B</given-names>
                    </name>
                    <degrees>MA, MD</degrees>
                    <xref ref-type="aff" rid="aff3">3</xref>
                </contrib>
            </contrib-group>
            <aff id="aff1" rid="aff1">
                <sup>1</sup>
                <institution>Northern Research Institute</institution>
                <addr-line>Troms&#248;</addr-line>
                <country>Norway</country>
            </aff>
            <aff id="aff2" rid="aff2">
                <sup>2</sup>
                <institution>Computer Science Department</institution>
                <institution>University of Troms&#248;</institution>
                <addr-line>Troms&#248;</addr-line>
                <country>Norway</country>
            </aff>
            <aff id="aff3" rid="aff3">
                <sup>3</sup>
                <institution>Institute for Health Informatics</institution>
                <institution>University of Minnesota</institution>
                <addr-line>Minneapolis, MN</addr-line>
                <country>United States</country>
            </aff>
            <pub-date pub-type="collection">
                <season>Jan-Feb</season>
                <year>2012</year>
            </pub-date>
            <pub-date pub-type="epub">
                <day>31</day>
                <month>01</month>
                <year>2012</year>
            </pub-date>
            <volume>14</volume>
            <issue>1</issue>
            <elocation-id>e22</elocation-id>
            <!--history from ojs - api-xml-->
            <history>
                <date date-type="received">
                    <day>06</day>
                    <month>11</month>
                    <year>2011</year>
                </date>
                <date date-type="rev-request">
                    <day>27</day>
                    <month>11</month>
                    <year>2011</year>
                </date>
                <date date-type="rev-recd">
                    <day>16</day>
                    <month>01</month>
                    <year>2012</year>
                </date>
                <date date-type="accepted">
                    <day>17</day>
                    <month>01</month>
                    <year>2012</year>
                </date>
            </history>
            <!--(c) the authors - correct author names and publication date here if necessary. Date in form ', dd.mm.yyyy' after jmir.org-->
            <copyright-statement>&#169;Luis Fernandez-Luque, Randi Karlsen, Genevieve B Melton. Originally published in the Journal of Medical Internet Research (http://www.jmir.org), 31.01.2012. </copyright-statement>
            <copyright-year>2012</copyright-year>
            <license license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/2.0/">
                <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (http://creativecommons.org/licenses/by/2.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on http://www.jmir.org/, as well as this copyright and license information must be included.</p>
            </license>
            <self-uri xlink:href="http://www.jmir.org/2012/1/e22/" xlink:type="simple" />
            <abstract>
                <sec sec-type="background">
                    <title>Background</title>
                    <p>Social media are becoming mainstream in the health domain. Despite the large volume of accurate and trustworthy health information available on social media platforms, finding good-quality health information can be difficult. Misleading health information can often be popular (eg, antivaccination videos) and therefore highly rated by general search engines. We believe that community wisdom about the quality of health information can be harnessed to help create tools for retrieving good-quality social media content.</p>
                </sec>
                <sec>
                    <title>Objectives</title>
                    <p>To explore approaches for extracting metrics about authoritativeness in online health communities and how these metrics positively correlate with the quality of the content.</p>
                </sec>
                <sec sec-type="methods">
                    <title>Methods</title>
                    <p>We designed a metric, called HealthTrust, that estimates the trustworthiness of social media content (eg, blog posts or videos) in a health community. The HealthTrust metric calculates reputation in an online health community based on link analysis. We used the metric to retrieve YouTube videos and channels about diabetes. In two different experiments, health consumers provided 427 ratings of 17 videos and professionals gave 162 ratings of 23 videos. In addition, two professionals reviewed 30 diabetes channels.</p>
                </sec>
                <sec sec-type="results">
                    <title>Results</title>
                    <p>HealthTrust may be used for retrieving online videos on diabetes, since it performed better than YouTube Search in most cases. Overall, of 20 potential channels, HealthTrust&#8217;s filtering allowed only 3 bad channels (15%) versus 8 (40%) on the YouTube list. Misleading and graphic videos (eg, featuring amputations) were more commonly found by YouTube Search than by searches based on HealthTrust. However, some videos from trusted sources had low HealthTrust scores, mostly from general health content providers, and therefore not highly connected in the diabetes community. When comparing video ratings from our reviewers, we found that HealthTrust achieved a positive and statistically significant correlation with professionals (Pearson <italic>r</italic>
                        <sub>10</sub> = .65, <italic>P</italic> = .02) and a trend toward significance with health consumers (<italic>r</italic>
                        <sub>7</sub> = .65, <italic>P</italic> = .06) with videos on hemoglobin A<sub>1c</sub>, but it did not perform as well with diabetic foot videos.</p>
                </sec>
                <sec sec-type="conclusions">
                    <title>Conclusions</title>
                    <p>The trust-based metric HealthTrust showed promising results when used to retrieve diabetes content from YouTube. Our research indicates that social network analysis may be used to identify trustworthy social media in health communities.</p>
                </sec>
            </abstract>
            <kwd-group>
                <kwd>Medical informatics</kwd>
                <kwd>information storage and retrieval</kwd>
                <kwd>video</kwd>
                <kwd>online systems</kwd>
                <kwd>health communication</kwd>
                <kwd>diabetes</kwd>
            </kwd-group>
        </article-meta>
    </front>
    <body>
        <sec sec-type="introduction">
            <title>Introduction</title>
            <p>The Internet is emerging as one of the main sources of consumer health information [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. Many health authorities, medical associations, hospitals, and patients have published or are publishing online content, including through social media platforms (eg, blogs, YouTube, or Twitter). Kaplan and Haenlein defined social media as consisting of a &#8220;set of Web applications, which allows the creation and exchange of user-generated content&#8221; [<xref ref-type="bibr" rid="ref3">3</xref>]. Social media are becoming increasingly mainstream in the health domain [<xref ref-type="bibr" rid="ref4">4</xref>-<xref ref-type="bibr" rid="ref6">6</xref>]. For example, there are more than 500 channels on YouTube created by American hospitals, containing thousands of videos [<xref ref-type="bibr" rid="ref7">7</xref>]. Similarly, the United Kingdom&#8217;s National Health Service has published more than 500 videos on YouTube [<xref ref-type="bibr" rid="ref8">8</xref>].</p>
            <p>Despite the large volume of good-quality health information available on social media platforms, finding accurate and trustworthy health information can be surprisingly difficult [<xref ref-type="bibr" rid="ref9">9</xref>-<xref ref-type="bibr" rid="ref13">13</xref>]. There is a great deal of misinformation, and one often comes across content promoting anorexia or avoiding vaccinations [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref15">15</xref>]. Sometimes bogus health information can become extremely popular and viral (eg, conspiracy theories about vaccination). Therefore, sifting through this to find trustworthy health information remains one of the main challenges faced by health consumers.</p>
            <p>In conjunction with the large quantity of information, many health consumers rely on online communities for relevant information. Indeed, online health communities have been found to be very effective in filtering misleading information [<xref ref-type="bibr" rid="ref16">16</xref>]. Members of online communities have to build their trust gradually, which makes it hard for sources that are not trusted to disseminate misinformation. It is also possible to ask peers about high-quality health information; however, peers are not available all the time and often cannot provide instant feedback.</p>
            <p>The objective of this study was to explore approaches for extracting metrics about authoritativeness in online health communities and how these metrics would positively correlate with the quality of the content. An authoritative member of the community (such as the American Diabetes Association) tends to publish or endorse content of better quality than do nonauthoritative members of the community. Using link-based analysis, we extracted a metric (called HealthTrust) about authoritativeness in a health community. We then implemented an algorithm for searching videos and channels based on HealthTrust and tested it with online diabetes content from YouTube.</p>
            <sec>
                <title>Background</title>
                <p>Outside of the health domain, human experts are rarely used in any scalable fashion for classifying and retrieving webpages. Web information retrieval systems rely on automatic approaches to harvest reputable online resources, mainly based on the analysis of links between pages [<xref ref-type="bibr" rid="ref17">17</xref>-<xref ref-type="bibr" rid="ref21">21</xref>]. In Google&#8217;s PageRank, links from one site to another can be modeled as an endorsement, and they are used to calculate a global rank of all the websites [<xref ref-type="bibr" rid="ref18">18</xref>]. Another example is the hyperlink-induced topic search (HITS) algorithm [<xref ref-type="bibr" rid="ref17">17</xref>]. As explained in the following section, HITS is a link analysis algorithm for ranking webpages based on two scores: authoritativeness and hubs. Hubs are essentially webpages that function as directories that have links to authoritative pages. The authorities are webpages that are linked by many of the most representative Webs, so they have a high authoritativeness within the community of Webs. Other algorithms, such as TrustRank, take into account trustworthiness in online communities, aimed at making the search more robust to Web spam [<xref ref-type="bibr" rid="ref20">20</xref>]. Gou et al explored how to use social network analysis for ranking online videos in a personalized manner [<xref ref-type="bibr" rid="ref21">21</xref>]. Mislove et al studied the integration of general-purpose social networks with online Web searches [<xref ref-type="bibr" rid="ref22">22</xref>].</p>
                <p>To our knowledge none of those algorithms have been studied in the health domain. One of the main challenges in the health domain is that misleading health information can be very popular (eg, antivaccination videos) and therefore may be paradoxically highly rated and not considered spam by general information retrieval algorithms.</p>
                <p>Health consumers need tailored tools to help them find good-quality health social media and websites. A common approach consists in creating quality labels for trustworthy health websites that adhere to a set of guidelines [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>]. Some studies have pointed out cases where those guidelines were not that effective for finding good health information [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref25">25</xref>]. Another difficulty is choosing among dozens of guidelines [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>]. These guidelines have been combined with automatic approaches that extract certain quality indicators [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref26">26</xref>-<xref ref-type="bibr" rid="ref28">28</xref>] used for online health information retrieval. However, automatic approaches are still not widely used. To our knowledge, none of these projects focus on link-based analysis and trust metrics of health websites, as generic search engines do. In addition, despite the popularity of health videos, we have not come across any project specifically aimed at developing tools to help find relevant health videos.</p>
            </sec>
        </sec>
        <sec sec-type="methods">
            <title>Methods</title>
            <p>In the next subsection, we describe the metric HealthTrust and how it can be integrated to enhance the search of social media content (ie, YouTube diabetes videos). In the subsequent subsections, we describe two studies aimed at evaluating the relationship between the HealthTrust scores of diabetes videos and channels, and their quality as perceived by end users. We designed these experiments to evaluate our hypothesis that HealthTrust&#8217;s metric can be used to improve the retrieval of health social media. In the first study, we evaluated the use of HealthTrust for filtering diabetes channels from YouTube. In a second study, we evaluated the correlation between HealthTrust scores and ratings of videos about diabetes <italic>A1c testing</italic> and <italic>diabetic foot</italic>.</p>
            <sec>
                <title>HealthTrust</title>
                <p>According to the Merriam Webster Dictionary, trust is an &#8220;assured reliance on the character, ability, strength, or truth of someone or something&#8221; [<xref ref-type="bibr" rid="ref29">29</xref>]. Other related terms, treated as equivalent to <italic>trust</italic>, are <italic>authoritativeness</italic> (&#8220;clearly accurate or knowledgeable&#8221; [<xref ref-type="bibr" rid="ref30">30</xref>]) and <italic>reputation</italic> (&#8220;overall quality or character as seen or judged by people in general&#8221; [<xref ref-type="bibr" rid="ref31">31</xref>]). In the Web information retrieval domain, trust has normally been based on the analysis of link structures. A link from one website to another implies an endorsement of the linked website; this approach is very similar to the calculation of impact factors for journals. Trust in the health domain is mainly related to the concept of authoritativeness in terms of the reliability and knowledge of the content creator. There are, however, many additional aspects related to trust such as <italic>appearance</italic> and <italic>impartiality</italic> [<xref ref-type="bibr" rid="ref32">32</xref>]. Within the scope of this study, we define trust as the &#8220;assured reliance on the quality of users and content within an online health community.&#8221;</p>
                <p>As we mentioned in the introduction, online health communities can be effective in filtering out misleading health information [<xref ref-type="bibr" rid="ref16">16</xref>]. Users disseminating misleading information have a hard job gaining trust within the community. A user creating videos about herbal cures for diabetes will receive less endorsement from the diabetes community than a video created by the American Diabetes Association.</p>
                <p>We assume that misleading information will be less endorsed within the health community. Consequently, trustworthiness within the health community will correlate with higher content quality. To compute the trustworthiness of health social media, we designed an algorithm to calculate a metric, called HealthTrust, that estimates the trustworthiness of social media content (eg, blog post or video) in the health community to which it belongs. To evaluate HealthTrust we designed an algorithm for searching online health videos based on that metric.</p>
                <sec>
                    <title>HealthTrust Metric</title>
                    <p>Users and content are heavily interconnected in the context of health social media. <xref ref-type="fig" rid="figure1">Figure 1</xref> shows that links between users and content form a graph that models a social network where it is possible to calculate trust-related metrics. Content and users are interconnected and can form a health community with a common interest (eg, diabetes).</p>
                    <p>HealthTrust (<xref ref-type="fig" rid="figure2">Figure 2</xref>) is a metric about trust of content and members of a health community. Trust can be modeled for both users (&#8220;I trust this author&#8221;) and content (&#8220;I trust this content&#8221;). In fact, your trust in a particular piece of content should be a combination of how much you trust its author and the content itself. Based on these considerations we designed the HealthTrust metric. To calculate HealthTrust a set of steps must be followed: (1) extraction of the community where HealthTrust is going to be applied, (2) calculation of the authoritativeness scores for content and users based on their links, and (3) calculation of HealthTrust scores. Finally, this score can be used for information retrieval purposes as explained in the subsection &#8220;HealthTrust for Search.&#8221;</p>
                    <fig id="figure1" position="float">
                        <label>Figure 1</label>
                        <caption>
                            <p>Example of a health social network.</p>
                        </caption>
                        <graphic xlink:href="jmir_v14i1e22_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                    </fig>
                    <fig id="figure2" position="float">
                        <label>Figure 2</label>
                        <caption>
                            <p>Calculation of the HealthTrust content score.</p>
                        </caption>
                        <graphic xlink:href="jmir_v14i1e22_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                    </fig>
                    <sec>
                        <title>Community Extraction</title>
                        <p>HealthTrust is applied to only a certain health community. That community can be identified by many different means, such as manual selection of users and heuristic approaches [<xref ref-type="bibr" rid="ref33">33</xref>]. As explained in the following section, in our study we extracted YouTube users interested in diabetes by using different search queries related to diabetes. Community extraction is a core aspect in HealthTrust, since the metric is not calculating the general authoritativeness of the content but rather the authoritativeness in a particular community. In the case of YouTube in general, MTV videos from rock stars may be more authoritative than videos from health agencies such as the US Centers for Disease Control and Prevention (CDC). On the contrary, with HealthTrust the focus is on intracommunity authoritativeness. For example, in the health community the CDC is far more authoritative than MTV.</p>
                        <p>For our case study we used the diabetes community on the online video-sharing platform YouTube. As shown in <xref ref-type="fig" rid="figure3">Figure 3</xref>, YouTube can be modeled as a social network where users (ie, channels) can build their reputation using different social links (eg, subscriptions, friendships, favorite videos, or comments) [<xref ref-type="bibr" rid="ref34">34</xref>]. In our study, we took into consideration favorite videos and subscriptions, since these links are the most commonly used by all members of the community.</p>
                        <p>In our first study we used the YouTube application programming interface (API) to search all the channels that had the keyword <italic>diabetes</italic> and extracted all the accessible information about them (eg, uploads, subscriptions, and favorites). In our second study, we extracted the community by searching for videos using a set of diabetes-related queries. We extracted all the information about these videos and their authors.</p>
                        <fig id="figure3" position="float">
                            <label>Figure 3</label>
                            <caption>
                                <p>YouTube’s social network. CDC = Centers for Disease Control and Prevention.</p>
                            </caption>
                            <graphic xlink:href="jmir_v14i1e22_fig3.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                        </fig>
                    </sec>
                    <sec>
                        <title>Authoritativeness Scores</title>
                        <p>The authoritativeness scores in HealthTrust can be calculated using link-based metrics such as PageRank scores [<xref ref-type="bibr" rid="ref18">18</xref>] or HITS authoritativeness [<xref ref-type="bibr" rid="ref17">17</xref>]. As explained in the next section, in our study we used the HITS authoritativeness score. In these algorithms, the links between websites are used to model a directed graph with incoming and outgoing links. A recursive algorithm is used to score the reputation of a website based on the incoming links, since an incoming link is considered an endorsement of the linked website. The HITS algorithm considers two types of nodes: authorities and hubs. The hubs are the nodes that tend to link to the most authoritative webpages. The authoritative scores in HITS are calculated based on the incoming links from hubs.</p>
                        <p>The authoritativeness scores of content and users are calculated as follows. First, the authoritativeness of content (<xref ref-type="fig" rid="figure4">Figure 4</xref>, right) is calculated based on the links between all users and content. Both content and users are considered nodes. Second, the authoritativeness of users (<xref ref-type="fig" rid="figure4">Figure 4</xref>, left) is calculated based on the links between all users, which are the only nodes. If a user likes or favors content from another user, this is considered as a link between the users.</p>
                        <p>In our study we used the Java Universal Network/Graph (JUNG) API [<xref ref-type="bibr" rid="ref35">35</xref>] to calculate the HITS authoritativeness values of users (ie, channels) and content (videos) as follows. First, for the authoritativeness of users, we created a graph where the nodes were the channels and the edges were their subscriptions (channel X subscribed to channel Y) and favorites (channel X favorited a video of channel Y). Then, that graph was used to calculate the HITS authoritativeness values of the channels. Second, for the authoritativeness scores of videos, we considered videos and channels to be nodes and the edges to be favorites (channel X favorited video Z) and subscriptions (channel X subscribed to channel Y). That graph was used to calculate the HITS authoritativeness values of the videos.</p>
                        <p>The authoritativeness values for content and users are calculated independently as shown in <xref ref-type="fig" rid="figure4">Figure 4</xref>. Therefore, to combine them it is necessary to normalize their ranges&#8212;for example, in our study we normalized the authoritativeness scores of videos and users between 0 and 1.</p>
                        <fig id="figure4" position="float">
                            <label>Figure 4</label>
                            <caption>
                                <p>Links (in blue) used to calculate authoritativeness of users (left) and content (right). Diagram based on <xref ref-type="fig" rid="figure1">Figure 1</xref>.</p>
                            </caption>
                            <graphic xlink:href="jmir_v14i1e22_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                        </fig>
                    </sec>
                    <sec>
                        <title>Calculation of HealthTrust</title>
                        <p>The HealthTrust score of a particular piece of content (eg, video or blog post) is the weighted combination of the normalized authoritativeness scores of the content and its author. The weighted combination is based on the InheritanceFactor. The weighted approach is designed to allow part of the trustworthiness to be inherited by the content from its author. Thus, new content from a trusted author will have a higher HealthTrust score than new content from an untrustworthy author. To give a high weight to the InheritanceFactor implies that the authoritativeness of the author is very important. For example, a video from the CDC will have implicit authoritativeness even if it is new and has never been rated or linked. An InheritanceFactor of 0 implies that there is no inheritance transfer of trust from the authors to their content, so all the authoritativeness is based on the video&#8217;s score.</p>
                        <p>As <xref ref-type="fig" rid="figure5">Figure 5</xref> shows, in the video study authoritativeness scores were combined with an InheritanceFactor of 0.7, meaning that the HITS authoritative value of videos weighed 30% and the author&#8217;s authoritativeness 70%. We decided on these values after testing with several queries (not used in our evaluation) in a previous data set. We observed that there were many new high-quality videos without links to them, so a lower value for the InheritanceFactor would have decreased their HealthTrust despite being from a trusted content provider.</p>
                        <fig id="figure5" position="float">
                            <label>Figure 5</label>
                            <caption>
                                <p>HealthTrust calculation for diabetes videos from YouTube.</p>
                            </caption>
                            <graphic xlink:href="jmir_v14i1e22_fig5.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                        </fig>
                    </sec>
                </sec>
                <sec>
                    <title>HealthTrust for Search</title>
                    <p>We believe that HealthTrust can be used to enhance the retrieval of content within health communities. To evaluate that possibility we designed a search algorithm that combines query matching with HealthTrust. Our search algorithm is based on combining two scores: (1) relevance of the content to the search query, and (2) HealthTrust. Relevance can be calculated using simple query matching (eg, the content contains the query in its title or in the description).</p>
                    <p>We implemented a search algorithm based on HealthTrust to study whether that metric may be used to retrieve diabetes videos. As shown in <xref ref-type="fig" rid="figure6">Figure 6</xref>, our search algorithm combined the syntactic query match with the HealthTrust values. If the query matched the video&#8217;s title the relevance was computed as 100% of the video&#8217;s HealthTrust score. If the query only matched the description, the relevance was computed as 20% of the video&#8217;s HealthTrust score. We decided on these values after observing the quality of video metadata. In particular, we observed that titles are very important to infer the relevance of videos, since descriptions and tags tend to be very heterogeneous (eg, due to tag spamming). In a previous study, we also found that the quality of comments on YouTube health videos can be very heterogeneous [<xref ref-type="bibr" rid="ref36">36</xref>].</p>
                    <fig id="figure6" position="float">
                        <label>Figure 6</label>
                        <caption>
                            <p>Relevance calculation for HealthTrust-based search.</p>
                        </caption>
                        <graphic xlink:href="jmir_v14i1e22_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                    </fig>
                </sec>
            </sec>
            <sec>
                <title>Study: Diabetes Channels and HealthTrust</title>
                <p>As described in a previous report [<xref ref-type="bibr" rid="ref37">37</xref>], in May 2010, we performed a study to evaluate the feasibility of using social network analysis to filter YouTube diabetes channels. The objective of this study was to test whether the authoritativeness values of the diabetes channels in YouTube are related to their quality.</p>
                <sec>
                    <title>Data Collection</title>
                    <p>
                        <xref ref-type="fig" rid="figure7">Figure 7</xref> describes how we extracted 5133 videos, 219 channels, 182 favorites, and 247 friendships about diabetes from YouTube using the YouTube API. We searched channels with the query <italic>diabetes</italic> and extracted their information (links, videos, descriptions, etc) to calculate their HealthTrust scores, which corresponded to the authoritativeness values of the channels, since we did not take videos into consideration in this study.</p>
                    <fig id="figure7" position="float">
                        <label>Figure 7</label>
                        <caption>
                            <p>Data extraction in the study of diabetes channels and HealthTrust. API = application programming interface; HITS = hyperlink-induced topic search.</p>
                        </caption>
                        <graphic xlink:href="jmir_v14i1e22_fig7.png" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                    </fig>
                </sec>
                <sec>
                    <title>Recruitment and Ratings</title>
                    <p>Two health care professionals rated channels from a list containing the top 20 diabetes channels retrieved by YouTube and HealthTrust&#8217;s top 20 channels. The reviewers received a list with all the channels alphabetically ordered and were asked to respond with &#8220;yes&#8221; or &#8220;no&#8221; to whether they would recommend the diabetes channel to a patient with diabetes.</p>
                    <p>The interrater agreement score based on Cohen kappa [<xref ref-type="bibr" rid="ref38">38</xref>] was calculated using the statistical framework R [<xref ref-type="bibr" rid="ref39">39</xref>] and resulted in good agreement (.61).</p>
                </sec>
                <sec>
                    <title>Data Analysis</title>
                    <p>We evaluated the results using the precision at K metric [<xref ref-type="bibr" rid="ref40">40</xref>], with K being the number of top-ranked retrieved results considered. This technique is used widely to evaluate Web search engines, since users tend to use only the top search results. We also evaluated the results with the metric discounted cumulative gain (DCG). DCG is commonly used to evaluate ranked lists of Web search results taking into account the position of the retrieved results [<xref ref-type="bibr" rid="ref41">41</xref>]. The relevance <italic>gain</italic> decreases logarithmically based on the position of the retrieved results.</p>
                </sec>
            </sec>
            <sec>
                <title>Search Study: Diabetes Videos and HealthTrust</title>
                <sec>
                    <title>Data Collection</title>
                    <p>In April 2011, we collected from YouTube 8087 diabetes videos using the search API with 20 different queries (<italic>diabetic foot</italic>, <italic>diabetes</italic>, <italic>diabetes ketoacidosis</italic>, etc) as explained in <xref ref-type="fig" rid="figure8">Figure 8</xref>. We also extracted all the available information about channels, subscriptions, and favorites. Finally, we calculated the HealthTrust scores for videos and channels.</p>
                    <p>Although our dataset contained videos found by different queries, we evaluated videos from only two queries in order to increase the number of responses per video. We limited our study to the evaluation of searches about two information needs that are important for most people affected by diabetes: diabetes foot issues and hemoglobin A<sub>1c</sub> (glycated hemoglobin) testing. Diabetes foot problems are very common among people with diabetes and require a lot of attention to avoid very serious complications that can lead to amputation. Diabetes hemoglobin A<sub>1c</sub> testing is a very common laboratory test to evaluate how well the diabetes is managed.</p>
                    <p>Most of the responders rated different videos, since there were four different lists and some of the surveys were not completely filled out. Therefore, there was not enough data to calculate a meaningful interannotator agreement score in this study. For each type of responder (professionals and consumers), we aggregated the ratings of the different videos and calculated the average rating values.</p>
                    <fig id="figure8" position="float">
                        <label>Figure 8</label>
                        <caption>
                            <p>Data extraction on the search study on diabetes videos and HealthTrust. API = application programming interface; HITS = hyperlink-induced topic search.</p>
                        </caption>
                        <graphic xlink:href="jmir_v14i1e22_fig8.png" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                    </fig>
                </sec>
                <sec>
                    <title>Recruitment</title>
                    <p>After extracting the dataset of diabetes videos we recruited professionals and health consumers to evaluate the results. The recruitment took place between April 25 and June 14, 2011.</p>
                    <p>We recruited health care professional reviewers using a snowball approach, where invitations were sent to professional mailing lists. We collected 82 informed consents, and 27 video surveys were completed (2 surveys were removed due to the lack of information about the profession of the respondents). In total, professionals provided 162 ratings of 23 videos.</p>
                    <p>We recruited health consumers from the online diabetes community TuDiabetes.org, which has more than 20,000 members. Information about the study was posted on the community&#8217;s main blog and in their mailing list (about 10,000 subscribers). We received 178 informed consents, and 73 surveys were partially or completely filled in. In total, consumers provided 427 ratings of 17 videos. A donation of US $5 per survey was given to the Diabetes Hands Foundation, which runs the online community.</p>
                </sec>
                <sec>
                    <title>Video Surveys</title>
                    <p>We evaluated the top 7 video search results for the queries <italic>diabetic foot</italic> and <italic>diabetes A1c</italic> using both HealthTrust and YouTube search (ordered by relevance). As depicted in <xref ref-type="fig" rid="figure9">Figure 9</xref>, after providing informed consent in a Web form the respondents were randomly assigned to a survey with videos to review. Respondents were not informed about the algorithm used to select the videos.</p>
                    <p>Professional reviewers were assigned to one of four different surveys: two about diabetic foot (one based on YouTube and the other on HealthTrust) and two for hemoglobin A<sub>1c</sub> testing. The two lists about diabetic foot for professionals contained 11 videos and the lists about hemoglobin A<sub>1c</sub> testing contained 12 videos. Health consumers were assigned to lists for the same queries, but the listed videos were limited to those published by a whitelist of trusted sources. The main reason for using a whitelist was to avoid showing misleading and disturbing videos to consumers (eg, videos featuring amputations). These lists for health consumers contained a total of 17 videos, 8 about diabetic foot and 9 about hemoglobin A<sub>1c</sub> testing.</p>
                    <p>Professionals and health consumers were asked to respond to the following questions about the videos with a Likert scale (eg, from strongly agree to strongly disagree): &#8220;Would you recommend this video to a patient with diabetes and questions about diabetic foot?&#8221; (question for professionals for a video from the list about diabetic foot); and &#8220;Do you like this video about diabetic foot?&#8221; (question for health consumers for a video from the list about diabetic foot).</p>
                    <fig id="figure9" position="float">
                        <label>Figure 9</label>
                        <caption>
                            <p>Process of obtaining informed consent from health care professionals and health consumers, and survey allocation.</p>
                        </caption>
                        <graphic xlink:href="jmir_v14i1e22_fig9.png" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                    </fig>
                </sec>
                <sec>
                    <title>Data Analysis</title>
                    <p>We evaluated the retrieved results using the metrics precision at K [<xref ref-type="bibr" rid="ref40">40</xref>] and DCG [<xref ref-type="bibr" rid="ref41">41</xref>]. However, we did not calculate either of these metrics for the health consumers, as they had a prefiltered dataset.</p>
                    <p>In addition, we used the Pearson correlation [<xref ref-type="bibr" rid="ref42">42</xref>] to study the correlation between the HealthTrust scores and the average ratings. Pearson correlation is commonly used to study linear dependence between two variables, and the correlation coefficient ranges from &#8722;1 to 1. The Pearson correlation was calculated using the psych package of statistical framework R [<xref ref-type="bibr" rid="ref39">39</xref>].</p>
                </sec>
            </sec>
        </sec>
        <sec sec-type="results">
            <title>Results</title>
            <sec>
                <title>Study of Diabetes Channels</title>
                <p>The first study was designed to evaluate the feasibility of using the HealthTrust metric to filter YouTube diabetes channels (aka users). We studied precision at K (K = 5, K = 10, and K = 20) in the top 20 diabetes channels retrieved by the YouTube- and HealthTrust-based searches.</p>
                <p>We proposed two possible scenarios for considering a channel relevant: (1) both reviewers recommended the channel, and (2) at least one reviewer recommended the channel. <xref ref-type="table" rid="table1">Table 1</xref> shows that the search based on HealthTrust scores performed better than YouTube search in all cases except precision at K = 5 for channels recommended by both reviewers, where the two searches performed equally well. The DCG evaluation (<xref ref-type="table" rid="table2">Table 2</xref>) also resulted in better scores for HealthTrust than for YouTube searches.</p>
                <table-wrap id="table1" position="float">
                    <label>Table 1</label>
                    <caption>
                        <p> Evaluation of the top 20 diabetes channels by precision at K metric</p>
                    </caption>
                    <table cellpadding="8" cellspacing="0" border="1" rules="groups" frame="hsides" width="1000">
                        <col width="223" />
                        <col width="97" />
                        <col width="97" />
                        <col width="97" />
                        <col width="97" />
                        <col width="97" />
                        <col width="97" />
                        <col width="97" />
                        <col width="97" />
                        <thead>
                            <tr valign="top">
                                <td rowspan="3">  Recommended by/precision at K  </td>
                                <td colspan="4">  Both reviewers  </td>
                                <td colspan="4">  At least one reviewer  </td>
                            </tr>
                            <tr valign="top">
                                <td colspan="2">  YouTube  </td>
                                <td colspan="2">  HealthTrust  </td>
                                <td colspan="2">  YouTube  </td>
                                <td colspan="2">  HealthTrust  </td>
                            </tr>
                            <tr valign="top">
                                <td>  n  </td>
                                <td>  %  </td>
                                <td>  n  </td>
                                <td>  %  </td>
                                <td>  n  </td>
                                <td>  %  </td>
                                <td>  n  </td>
                                <td>  %  </td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td>  K = 5  </td>
                                <td>  4  </td>
                                <td>  80%  </td>
                                <td>  4  </td>
                                <td>  80%  </td>
                                <td>  4  </td>
                                <td>  80%  </td>
                                <td>  5  </td>
                                <td>  100%  </td>
                            </tr>
                            <tr valign="top">
                                <td>  K = 10  </td>
                                <td>  6  </td>
                                <td>  60%  </td>
                                <td>  7  </td>
                                <td>  70%  </td>
                                <td>  7  </td>
                                <td>  70%  </td>
                                <td>  9  </td>
                                <td>  90%  </td>
                            </tr>
                            <tr valign="top">
                                <td>  K = 20  </td>
                                <td>  10  </td>
                                <td>  50%  </td>
                                <td>  13  </td>
                                <td>  65%  </td>
                                <td>  12  </td>
                                <td>  60%  </td>
                                <td>  17  </td>
                                <td>  85%  </td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
                <table-wrap id="table2" position="float">
                    <label>Table 2</label>
                    <caption>
                        <p> Evaluation of the top 20 diabetes channels by discounted cumulative gain (DCG) metric</p>
                    </caption>
                    <table cellpadding="8" cellspacing="0" border="1" rules="groups" frame="hsides" width="1000">
                        <col width="227" />
                        <col width="174" />
                        <col width="213" />
                        <col width="174" />
                        <col width="213" />
                        <thead>
                            <tr valign="top">
                                <td rowspan="2">  Recommended by/DCGi<sup>a</sup>
                                </td>
                                <td colspan="2">  Both reviewers  </td>
                                <td colspan="2">  At least one reviewer  </td>
                            </tr>
                            <tr valign="top">
                                <td>  YouTube  </td>
                                <td>  HealthTrust  </td>
                                <td>  YouTube  </td>
                                <td>  HealthTrust  </td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td>  i = 5  </td>
                                <td>  2.9  </td>
                                <td>  3.1  </td>
                                <td>  2.9  </td>
                                <td>  3.6  </td>
                            </tr>
                            <tr valign="top">
                                <td>  i = 10  </td>
                                <td>  3.6  </td>
                                <td>  4.1  </td>
                                <td>  4  </td>
                                <td>  4.9  </td>
                            </tr>
                            <tr valign="top">
                                <td>  i = 20  </td>
                                <td>  4.6  </td>
                                <td>  5.7  </td>
                                <td>  5.3  </td>
                                <td>  7  </td>
                            </tr>
                        </tbody>
                    </table>
                    <table-wrap-foot>
                        <fn id="table2fn1">
                            <p>
                                <sup>a</sup> i = number of retrieved channels.</p>
                        </fn>
                    </table-wrap-foot>
                </table-wrap>
                <p>To consider and analyze the capacity of the algorithms to filter out bad content or spam, we considered a channel to be misleading if none of the reviewers recommended it. HealthTrust&#8217;s approach performed quite well, filtering out bad channels. For K = 20, HealthTrust&#8217;s list had only 3 bad channels (15%) versus 8 (40%) on the YouTube list. In the top 10 channels, HealthTrust had only 1 bad channel (10%) versus 3 (30%) for YouTube. Within the top 5 channels, all HealthTrust&#8217;s channels were recommended by at least one reviewer, one more than YouTube.</p>
                <p>In the YouTube top 20, some channels featured commercials of diabetes products (eg, testing supplies), several were about a famous diabetic singer (Jonas), and one channel was in Dutch (even though we restricted the search to English in the API). The YouTube list also contained some channels with the word diabetes in its name, but most of the videos were not related to diabetes.</p>
                <p>The HealthTrust list did not contain any channels with advertising, but it did have some channels from e-patients with very heterogeneous quality. Surprisingly, some diabetes channels run by public authorities, such as the Juvenile Diabetes Research Foundation, were not highly ranked in HealthTrust. The most logical explanation for this is that some relevant channels do not encourage social interactions (eg, friendships or subscriptions), and this less-connected nature may decrease their rankings.</p>
            </sec>
            <sec>
                <title>Study of Diabetes Videos</title>
                <p>In the second study, we explored how the HealthTrust metric can be used to retrieve diabetes videos and also the correlation between HealthTrust and the video&#8217;s ratings.</p>
                <sec>
                    <title>HealthTrust Search Evaluation</title>
                    <p>We calculated precision at K for the list created for professionals to evaluate the performance of the search algorithm. However, we did not study precision at K for consumers, since the dataset was prefiltered.</p>
                    <p>For precision at K (K = 3, K = 7) on the professionals&#8217; lists, a video was considered relevant if its rating was equal to or greater than 3.5 (values range from 1 to 5). As shown in <xref ref-type="table" rid="table3">Table 3</xref>, precision was better in HealthTrust for both the diabetes A<sub>1c</sub> and diabetic foot lists. In the case of diabetic foot, the YouTube list precision was below 50% for both the top 7 and the top 3. The HealthTrust-based search also performed better based on the DCG metric (<xref ref-type="table" rid="table4">Table 4</xref>).</p>
                    <table-wrap id="table3" position="float">
                        <label>Table 3</label>
                        <caption>
                            <p> Precision at K for videos evaluated by professionals retrieved by HealthTrust and YouTube</p>
                        </caption>
                        <table cellpadding="8" cellspacing="0" border="1" rules="groups" frame="hsides" width="1000">
                            <col width="154" />
                            <col width="106" />
                            <col width="106" />
                            <col width="106" />
                            <col width="106" />
                            <col width="106" />
                            <col width="106" />
                            <col width="106" />
                            <col width="106" />
                            <thead>
                                <tr valign="top">
                                    <td rowspan="3">  Precision at K  </td>
                                    <td colspan="4">  Hemoglobin A<sub>1c</sub>
                                    </td>
                                    <td colspan="4">  Diabetic foot  </td>
                                </tr>
                                <tr valign="top">
                                    <td colspan="2">  YouTube  </td>
                                    <td colspan="2">  HealthTrust  </td>
                                    <td colspan="2">  YouTube  </td>
                                    <td colspan="2">  HealthTrust  </td>
                                </tr>
                                <tr valign="top">
                                    <td>  n  </td>
                                    <td>  %  </td>
                                    <td>  n  </td>
                                    <td>  %  </td>
                                    <td>  n  </td>
                                    <td>  %  </td>
                                    <td>  n  </td>
                                    <td>  %  </td>
                                </tr>
                            </thead>
                            <tbody>
                                <tr valign="top">
                                    <td>  K = 3  </td>
                                    <td>  2  </td>
                                    <td>  66%  </td>
                                    <td>  3  </td>
                                    <td>  100%  </td>
                                    <td>  1  </td>
                                    <td>  33%  </td>
                                    <td>  2  </td>
                                    <td>  66%  </td>
                                </tr>
                                <tr valign="top">
                                    <td>  K = 7  </td>
                                    <td>  4  </td>
                                    <td>  57%  </td>
                                    <td>  5  </td>
                                    <td>  70%  </td>
                                    <td>  3  </td>
                                    <td>  43%  </td>
                                    <td>  4  </td>
                                    <td>  57%  </td>
                                </tr>
                            </tbody>
                        </table>
                    </table-wrap>
                    <table-wrap id="table4" position="float">
                        <label>Table 4</label>
                        <caption>
                            <p> Discounted cumulative gain (DCG) for videos evaluated by professionals retrieved by HealthTrust and YouTube</p>
                        </caption>
                        <table cellpadding="8" cellspacing="0" border="1" rules="groups" frame="hsides" width="1000">
                            <col width="145" />
                            <col width="192" />
                            <col width="235" />
                            <col width="192" />
                            <col width="235" />
                            <thead>
                                <tr valign="top">
                                    <td rowspan="2">  DCGi<sup>a</sup>
                                    </td>
                                    <td colspan="2">  Hemoglobin A<sub>1c</sub>
                                    </td>
                                    <td colspan="2">  Diabetic foot  </td>
                                </tr>
                                <tr valign="top">
                                    <td>  YouTube  </td>
                                    <td>  HealthTrust  </td>
                                    <td>  YouTube  </td>
                                    <td>  HealthTrust  </td>
                                </tr>
                            </thead>
                            <tbody>
                                <tr valign="top">
                                    <td>  i = 3  </td>
                                    <td>  1.6  </td>
                                    <td>  2.6  </td>
                                    <td>  1  </td>
                                    <td>  2  </td>
                                </tr>
                                <tr valign="top">
                                    <td>  i = 7  </td>
                                    <td>  2.6  </td>
                                    <td>  3.4  </td>
                                    <td>  1.9  </td>
                                    <td>  2.9  </td>
                                </tr>
                            </tbody>
                        </table>
                        <table-wrap-foot>
                            <fn id="table4fn1">
                                <p>
                                    <sup>a</sup> i = number of retrieved videos.</p>
                            </fn>
                        </table-wrap-foot>
                    </table-wrap>
                </sec>
                <sec>
                    <title>HealthTrust and Rating Correlation</title>
                    <p>The study of the correlation between HealthTrust score and average rating was used to determine whether our trustworthiness score had a positive impact on the ratings.</p>
                    <p>For both professionals and consumers, we created two subsets with the videos of each topic (hemoglobin A<sub>1c</sub> testing and diabetic foot). We normalized the average ratings of the videos between 0 and 1 for the subset with the videos about hemoglobin A<sub>1c</sub> testing and the subset about diabetic foot. Similarly, we normalized the HealthTrust scores within each subset. As shown in <xref ref-type="table" rid="table5">Table 5</xref>, we compared average ratings and HealthTrust scores for each subset using the Pearson correlation (alpha = .05).</p>
                    <table-wrap id="table5" position="float">
                        <label>Table 5</label>
                        <caption>
                            <p> Pearson correlation between ratings and HealthTrust</p>
                        </caption>
                        <table cellpadding="8" cellspacing="0" border="1" rules="groups" frame="hsides" width="1000">
                            <col width="269" />
                            <col width="206" />
                            <col width="160" />
                            <col width="206" />
                            <col width="160" />
                            <thead>
                                <tr valign="top">
                                    <td rowspan="2" />
                                    <td colspan="2">  Hemoglobin A<sub>1c</sub>
                                    </td>
                                    <td colspan="2">  Diabetic foot  </td>
                                </tr>
                                <tr valign="top">
                                    <td>  Pearson <italic>r</italic>
                                    </td>
                                    <td>
                                        <italic>P</italic> value  </td>
                                    <td>  Pearson <italic>r</italic>
                                    </td>
                                    <td>
                                        <italic>P</italic> value  </td>
                                </tr>
                            </thead>
                            <tbody>
                                <tr valign="top">
                                    <td>  Professionals  </td>
                                    <td>
                                        <italic>r</italic>
                                        <sub>10</sub> = .646  </td>
                                    <td>  .02  </td>
                                    <td>
                                        <italic>r</italic>
                                        <sub>9</sub> = .275  </td>
                                    <td>  .41  </td>
                                </tr>
                                <tr valign="top">
                                    <td>  Health consumers  </td>
                                    <td>
                                        <italic>r</italic>
                                        <sub>7</sub> = .649  </td>
                                    <td>  .06  </td>
                                    <td>
                                        <italic>r</italic>
                                        <sub>6</sub> = &#8722;.019  </td>
                                    <td>  .96  </td>
                                </tr>
                            </tbody>
                        </table>
                    </table-wrap>
                    <p>In the case of the hemoglobin A<sub>1c</sub> videos, we found a positive and statistically significant correlation for the professionals&#8217; subset (Pearson <italic>r</italic>
                        <sub>10</sub> = .646, <italic>P</italic> = .02). The correlation for the health consumers was of similar magnitude but only close to significance levels (<italic>r</italic>
                        <sub>7</sub> = .649, <italic>P</italic> = .06). In the case of the diabetic foot videos, we did not find a statistically significant result in any of the subsets (professionals and consumers).</p>
                </sec>
            </sec>
        </sec>
        <sec sec-type="discussion">
            <title>Discussion</title>
            <sec>
                <title>HealthTrust Metric Performance</title>
                <p>Our results suggest that social network analysis may be used to gather information about the quality of health information. The retrieval of diabetes videos and channels based on the HealthTrust metric performed reasonably well, compared with the YouTube search. In nearly all cases, the precision of the lists retrieved using HealthTrust was better than those retrieved using YouTube. Precision is very important, since in the health domain irrelevant content can potentially have very negative effects (see <xref ref-type="fig" rid="figure10">Figure 10</xref>). It is quite significant that the performance of HealthTrust was equal to or better than that of the YouTube search, considering that YouTube has access to all the metadata about videos and users, while HealthTrust has limited access via its API; for example, some channels restrict access to information about their links (eg, subscriptions).</p>
                <p>It is difficult to identify the exact differences between the YouTube and HealthTrust searches, since YouTube has not published its search algorithm, despite having published its recommendation algorithm [<xref ref-type="bibr" rid="ref43">43</xref>]. However, we expect YouTube&#8217;s search engine to be based on link analysis, as are most search engines. The main difference between traditional Web search engines and our approach is that we strengthened the tightly knit community effect [<xref ref-type="bibr" rid="ref19">19</xref>], as with diabetes; traditionally, Web search engines try to reduce the influence of those communities to raise general public satisfaction. Consequently, funny or controversial videos are more popular among the general YouTube community and are therefore more highly rated. These videos lose prominence using HealthTrust. In fact, the search based on the HealthTrust metric performed better than YouTube in filtering out misleading videos (eg, herbal cures or advertisements). The HealthTrust algorithm estimates health-related trust and not general trust on YouTube.</p>
                <fig id="figure10" position="float">
                    <label>Figure 10</label>
                    <caption>
                        <p>Highly ranked YouTube video about diabetic foot featuring an infected wound.</p>
                    </caption>
                    <graphic xlink:href="jmir_v14i1e22_fig10.png" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
            </sec>
            <sec>
                <title>HealthTrust Weaknesses</title>
                <p>Some good videos from trusted sources, such as public health authorities, gained relatively low HealthTrust values. The best explanation for the algorithm&#8217;s behavior is that creators of those videos had fewer connections in the diabetes community. Some of these sources belonged to a more generic health community (eg, CDCStreamingHealth&#8217;s Channel) and therefore had weaker ties with the diabetes community. Also, some trusted sources do not create links with other users (eg, through friendships, subscriptions, or comments). This lack of connectivity leads to lower scores in HealthTrust. As part of our future work, we will design an enhanced version of HealthTrust that calculates trustworthiness values within several health communities.</p>
                <p>Many factors influence the perceived quality of a video beyond trustworthiness and authoritativeness. Therefore, it is not surprising that we did not find statistically significant correlations in all cases. Personal taste and preferences play a major role. For example, the video <italic>O is for outrage &#8211; Type 1 diabetes</italic> (<xref ref-type="fig" rid="figure11">Figure 11</xref>) was given a higher rating by health consumers (average of 4.2) than by professionals (average of 2.75). <italic>O is for outrage</italic> is a video appealing to emotional aspects to raise awareness; it is very engaging to the online diabetes community. However, this particular video is less informative, which may explain why professionals rated it lower. Consequently, a generic quality indicator such as HealthTrust cannot always satisfy everybody.</p>
                <p>There were videos from certain channels with quite different average ratings but the same HealthTrust scores. In such cases, the videos had no links (favorites) but inherited the HealthTrust scores from their channels. An example of this problem is shown in the following two videos from the diabetic foot list for consumers: (1) <italic>Baseball great Ron Santo &#38; Diabetes--INCREDIBLE Story</italic>, and (2) <italic>Miami Ink&#8217;s Darren Brass: Tattoos and Diabetes</italic>. Both videos have the same HealthTrust score, as both are from the same diabetes channel, dLifedotcom. However, the <italic>Miami Ink</italic> video was less appealing to health consumers. In this case, link analysis was not enough to distinguish the quality between the two videos. The only way to solve this problem is to analyze more data about the video (eg, semantic analysis or ratings).</p>
                <fig id="figure11" position="float">
                    <label>Figure 11</label>
                    <caption>
                        <p>Screenshot from the video <italic>O is for outrage – Type 1 diabetes</italic>.</p>
                    </caption>
                    <graphic xlink:href="jmir_v14i1e22_fig11.png" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
            </sec>
            <sec>
                <title>Limitations</title>
                <p>In both experiments, some videos or channels were deleted while we were conducting the experiment. In the case of the channel study, two were removed, and in the second study some videos gained lower ratings because they were made private by their authors. It is unlikely that this problem biased our study, since it affected a small sample and it affected all the algorithms equally.</p>
                <p>To be able to generalize our findings, we will have to perform large-scale studies with more queries, reviewers, and videos. Our survey-based evaluation approach is merely an approximation of the real context of health consumers&#8217; search for information. Survey-based evaluation of online videos is very time consuming, as most videos last several minutes. It was necessary to watch around 30 minutes of videos to complete our surveys. Hence, to generalize our findings we are implementing a video portal to capture more data for evaluation within the real user context. The video portal will also need to address the continuous changes in the structure of online communities (eg, reputation changes over time). A possible solution for the dynamic nature of online communities may be periodic calculation of HealthTrust.</p>
                <p>Moreover, it remains to be seen whether our approach will work in health domains where there is a large community of users promoting misleading information. For example, there are communities promoting anorexia as a lifestyle [<xref ref-type="bibr" rid="ref15">15</xref>] or against vaccination [<xref ref-type="bibr" rid="ref14">14</xref>]. Pro-anorexia users will tend to link and endorse misleading information; thus, if HealthTrust is to be used to retrieve trustworthy content about anorexia it must be able to avoid pro-anorexia subcommunities.</p>
                <p>Our current study is limited to online health videos; therefore, we will need to replicate our study with other types of social media in order to generalize our findings. We believe that the metric HealthTrust can be applied to any type of linked health community where users are interconnected via follows, friendships, and favorite content. However, experiments will need to be performed to evaluate the algorithm, since each type of community may have a different structure and dynamics.</p>
                <p>Our study is limited to automatic approaches for extracting trust-based metrics and the feasibility of using these metrics to retrieve health videos. More research will be needed to test how to combine HealthTrust with manual selection of social media by human experts. HealthTrust can be very useful to automatically identify the most trusted sources within the diabetes community. However, some trustworthy providers have very good content but have not gained enough trust within the online community.</p>
            </sec>
            <sec>
                <title>Conclusions</title>
                <p>Every day, millions of health consumers search for health information on social platforms such as YouTube, and retrieving accurate information from trusted sources can often be difficult. There is an unsatisfied need for new information retrieval tools to help health consumers find trustworthy and relevant health information within social media.</p>
                <p>In this paper we present a new metric, called HealthTrust, to infer information about the trustworthiness of social media content within a health community. We tested the feasibility of using HealthTrust for retrieving videos from the diabetes community on YouTube. Based on our evaluation with health consumers and professionals, the search of diabetes content based on the HealthTrust metric performed better than YouTube in nearly all the tested cases. However, a larger study is needed to validate our results in a health portal in order to test the metric in a live setting.</p>
                <p>Despite the limitations of our study, we conclude that social network analysis may be applied to retrieving health information from social media and used to develop tools that will ultimately help find relevant and trustworthy information. Social network analysis could also be used to reinforce other approaches to health information retrieval such as quality labels and manual review of content.</p>
            </sec>
        </sec>
    </body>
    <back>
        <glossary>
            <title>Abbreviations</title>
            <def-list>
                <def-item>
                    <term id="abb1">API</term>
                    <def>
                        <p> application programming interface</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb2">DCG</term>
                    <def>
                        <p> discounted cumulative gain</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb3">CDC</term>
                    <def>
                        <p> Centers for Disease Control and Prevention</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb4">HITS</term>
                    <def>
                        <p> hyperlink-induced topic search</p>
                    </def>
                </def-item>
            </def-list>
        </glossary>
        <ack>
            <p>We would like to thank our colleagues for their very useful comments, which helped to improve this paper, especially Prof. Joseph A Konstan from the GroupLens group in the Department of Computer Science and Engineering at the University of Minnesota. In addition, we would like to thank the Diabetes Hands Foundation for their support in the recruitment of people with diabetes.</p>
            <p>This project belongs to the Troms&#248; Telemedicine Laboratory cofunded by the Research Council of Norway, project 174934.</p>
        </ack>
        <fn-group>
            <fn fn-type="con">
                <p>LFL was involved in all the research and manuscript preparation.</p>
                <p>RK reviewed the manuscript and advised LFL with regard to the algorithm aspects of the study.</p>
                <p>GBM participated in the study design, institutional review board application, and recruitment, and reviewed the manuscript.</p>
            </fn>
        </fn-group>
        <ref-list>
            <ref id="ref1">
                <label>1</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Fox</surname>
                            <given-names>S</given-names>
                        </name>
                    </person-group>
                    <source>Online health search 2006</source>
                    <year>2006</year>
                    <month>10</month>
                    <day>29</day>
                    <access-date>2012-01-26</access-date>
                    <publisher-loc>Washington, DC</publisher-loc>
                    <publisher-name>Pew Internet &#38; American Life Project</publisher-name>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.pewinternet.org/~/media//Files/Reports/2006/PIP_Online_Health_2006.pdf.pdf">http://www.pewinternet.org/~/media//Files/Reports/2006/PIP_Online_Health_2006.pdf.pdf</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">64zCRIRq5</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref2">
                <label>2</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Kummervold</surname>
                            <given-names>PE</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Chronaki</surname>
                            <given-names>CE</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lausen</surname>
                            <given-names>B</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Prokosch</surname>
                            <given-names>HU</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Rasmussen</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Santana</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Staniszewski</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Wangberg</surname>
                            <given-names>SC</given-names>
                        </name>
                    </person-group>
                    <article-title>eHealth trends in Europe 2005-2007: a population-based survey</article-title>
                    <source>J Med Internet Res</source>
                    <year>2008</year>
                    <volume>10</volume>
                    <issue>4</issue>
                    <fpage>e42</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2008/4/e42/" />
                    </comment>
                    <pub-id pub-id-type="doi">10.2196/jmir.1023</pub-id>
                    <pub-id pub-id-type="medline">19017584</pub-id>
                    <pub-id pub-id-type="pii">v10i4e42</pub-id>
                    <pub-id pub-id-type="pmcid">PMC2629359</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref3">
                <label>3</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Kaplan</surname>
                            <given-names>AM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Haenlein</surname>
                            <given-names>M</given-names>
                        </name>
                    </person-group>
                    <article-title>Users of the world, unite! The challenges and opportunities of social media</article-title>
                    <source>Business Horizons</source>
                    <year>2010</year>
                    <volume>53</volume>
                    <issue>1</issue>
                    <fpage>59</fpage>
                    <lpage>68</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.bushor.2009.09.003</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref4">
                <label>4</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Lau</surname>
                            <given-names>AY</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Siek</surname>
                            <given-names>KA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Fernandez-Luque</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Tange</surname>
                            <given-names>H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Chhanabhai</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Li</surname>
                            <given-names>SY</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Elkin</surname>
                            <given-names>PL</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Arjabi</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Walczowski</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ang</surname>
                            <given-names>CS</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Eysenbach</surname>
                            <given-names>G</given-names>
                        </name>
                    </person-group>
                    <article-title>The role of social media for patients and consumer health: contribution of the IMIA Consumer Health Informatics Working Group</article-title>
                    <source>Yearb Med Inform</source>
                    <year>2011</year>
                    <volume>6</volume>
                    <issue>1</issue>
                    <fpage>131</fpage>
                    <lpage>8</lpage>
                    <pub-id pub-id-type="medline">21938338</pub-id>
                    <pub-id pub-id-type="pii">me11010131</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref5">
                <label>5</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Fox</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Jones</surname>
                            <given-names>S</given-names>
                        </name>
                    </person-group>
                    <source>The social life of health information</source>
                    <year>2009</year>
                    <month>06</month>
                    <day>11</day>
                    <access-date>2010-12-07</access-date>
                    <publisher-loc>Washington, DC</publisher-loc>
                    <publisher-name>Pew Internet &#38; American Life Project</publisher-name>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.pewinternet.org/~/media//Files/Reports/2009/PIP_Health_2009.pdf">http://www.pewinternet.org/~/media//Files/Reports/2009/PIP_Health_2009.pdf</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">5uno4xyeW</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref6">
                <label>6</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Paton</surname>
                            <given-names>C</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Bamidis</surname>
                            <given-names>PD</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Eysenbach</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hansen</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Cabrer</surname>
                            <given-names>M</given-names>
                        </name>
                    </person-group>
                    <article-title>Experience in the use of social media in medical and health education: contribution of the IMIA Social Media Working Group</article-title>
                    <source>Yearb Med Inform</source>
                    <year>2011</year>
                    <volume>6</volume>
                    <issue>1</issue>
                    <fpage>21</fpage>
                    <lpage>9</lpage>
                    <pub-id pub-id-type="medline">21938320</pub-id>
                    <pub-id pub-id-type="pii">me11010021</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref7">
                <label>7</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Bennett</surname>
                            <given-names>E</given-names>
                        </name>
                    </person-group>
                    <source>Found in Cache</source>
                    <year>2011</year>
                    <month>10</month>
                    <day>9</day>
                    <access-date>2011-11-06</access-date>
                    <comment>Hospital Social Network List<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://ebennett.org/hsnl/">http://ebennett.org/hsnl/</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">62zskSpvI</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref8">
                <label>8</label>
                <nlm-citation citation-type="web">
                    <source>YouTube</source>
                    <year>2011</year>
                    <access-date>2011-11-06</access-date>
                    <comment>NHSChoices Channel.  Sep 12<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.youtube.com/user/NHSChoices">http://www.youtube.com/user/NHSChoices</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">62zsQQ4cu</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref9">
                <label>9</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Greenberg</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>D'Andrea</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lorence</surname>
                            <given-names>D</given-names>
                        </name>
                    </person-group>
                    <article-title>Setting the public agenda for online health search: a white paper and action agenda</article-title>
                    <source>J Med Internet Res</source>
                    <year>2004</year>
                    <month>06</month>
                    <day>8</day>
                    <volume>6</volume>
                    <issue>2</issue>
                    <fpage>e18</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2004/2/e18/" />
                    </comment>
                    <pub-id pub-id-type="doi">10.2196/jmir.6.2.e18</pub-id>
                    <pub-id pub-id-type="medline">15249267</pub-id>
                    <pub-id pub-id-type="pii">v6e18</pub-id>
                    <pub-id pub-id-type="pmcid">PMC1550592</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref10">
                <label>10</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Eysenbach</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Powell</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kuss</surname>
                            <given-names>O</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sa</surname>
                            <given-names>ER</given-names>
                        </name>
                    </person-group>
                    <article-title>Empirical studies assessing the quality of health information for consumers on the world wide web: a systematic review</article-title>
                    <source>JAMA</source>
                    <year>2002</year>
                    <month>05</month>
                    <volume>287</volume>
                    <issue>20</issue>
                    <fpage>2691</fpage>
                    <lpage>700</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://jama.ama-assn.org/cgi/pmidlookup?view=long&#38;pmid=12020305" />
                    </comment>
                    <pub-id pub-id-type="medline">12020305</pub-id>
                    <pub-id pub-id-type="pii">jrv10005</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref11">
                <label>11</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Bernstam</surname>
                            <given-names>EV</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Walji</surname>
                            <given-names>MF</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sagaram</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sagaram</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Johnson</surname>
                            <given-names>CW</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Meric-Bernstam</surname>
                            <given-names>F</given-names>
                        </name>
                    </person-group>
                    <article-title>Commonly cited website quality criteria are not effective at identifying inaccurate online information about breast cancer</article-title>
                    <source>Cancer</source>
                    <year>2008</year>
                    <month>03</month>
                    <day>15</day>
                    <volume>112</volume>
                    <issue>6</issue>
                    <fpage>1206</fpage>
                    <lpage>13</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://dx.doi.org/10.1002/cncr.23308" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1002/cncr.23308</pub-id>
                    <pub-id pub-id-type="medline">18266210</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref12">
                <label>12</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Mayer</surname>
                            <given-names>MA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Darmoni</surname>
                            <given-names>SJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Fiene</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>K&#246;hler</surname>
                            <given-names>C</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Roth-Berghofer</surname>
                            <given-names>TR</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Eysenbach</surname>
                            <given-names>G</given-names>
                        </name>
                    </person-group>
                    <article-title>MedCIRCLE: collaboration for Internet rating, certification, labelling and evaluation of health information on the World-Wide-Web</article-title>
                    <source>Stud Health Technol Inform</source>
                    <year>2003</year>
                    <volume>95</volume>
                    <fpage>667</fpage>
                    <lpage>72</lpage>
                    <pub-id pub-id-type="medline">14664064</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref13">
                <label>13</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Mayer</surname>
                            <given-names>MA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Karkaletsis</surname>
                            <given-names>V</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Stamatakis</surname>
                            <given-names>K</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Leis</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Villarroel</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Thomeczek</surname>
                            <given-names>C</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Labsk&#253;</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>L&#243;pez-Ostenero</surname>
                            <given-names>F</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Honkela</surname>
                            <given-names>T</given-names>
                        </name>
                    </person-group>
                    <article-title>MedIEQ-Quality labelling of medical web content using multilingual information extraction</article-title>
                    <source>Stud Health Technol Inform</source>
                    <year>2006</year>
                    <volume>121</volume>
                    <fpage>183</fpage>
                    <lpage>90</lpage>
                    <pub-id pub-id-type="medline">17095816</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref14">
                <label>14</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Ache</surname>
                            <given-names>KA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Wallace</surname>
                            <given-names>LS</given-names>
                        </name>
                    </person-group>
                    <article-title>Human papillomavirus vaccination coverage on YouTube</article-title>
                    <source>Am J Prev Med</source>
                    <year>2008</year>
                    <month>10</month>
                    <volume>35</volume>
                    <issue>4</issue>
                    <fpage>389</fpage>
                    <lpage>92</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.amepre.2008.06.029</pub-id>
                    <pub-id pub-id-type="medline">18675530</pub-id>
                    <pub-id pub-id-type="pii">S0749-3797(08)00597-7</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref15">
                <label>15</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Norris</surname>
                            <given-names>ML</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Boydell</surname>
                            <given-names>KM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Pinhas</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Katzman</surname>
                            <given-names>DK</given-names>
                        </name>
                    </person-group>
                    <article-title>Ana and the Internet: a review of pro-anorexia websites</article-title>
                    <source>Int J Eat Disord</source>
                    <year>2006</year>
                    <month>09</month>
                    <volume>39</volume>
                    <issue>6</issue>
                    <fpage>443</fpage>
                    <lpage>7</lpage>
                    <pub-id pub-id-type="doi">10.1002/eat.20305</pub-id>
                    <pub-id pub-id-type="medline">16721839</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref16">
                <label>16</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Esquivel</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Meric-Bernstam</surname>
                            <given-names>F</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Bernstam</surname>
                            <given-names>EV</given-names>
                        </name>
                    </person-group>
                    <article-title>Accuracy and self correction of information received from an internet breast cancer list: content analysis</article-title>
                    <source>BMJ</source>
                    <year>2006</year>
                    <month>04</month>
                    <day>22</day>
                    <volume>332</volume>
                    <issue>7547</issue>
                    <fpage>939</fpage>
                    <lpage>42</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.bmj.com/cgi/pmidlookup?view=long&#38;pmid=16513686" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1136/bmj.38753.524201.7C</pub-id>
                    <pub-id pub-id-type="medline">16513686</pub-id>
                    <pub-id pub-id-type="pii">bmj.38753.524201.7C</pub-id>
                    <pub-id pub-id-type="pmcid">PMC1444809</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref17">
                <label>17</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Kleinberg</surname>
                            <given-names>JM</given-names>
                        </name>
                    </person-group>
                    <article-title>Authoritative sources in a hyperlinked environment</article-title>
                    <source>J ACM</source>
                    <year>1999</year>
                    <volume>46</volume>
                    <issue>5</issue>
                    <fpage>604</fpage>
                    <lpage>32</lpage>
                    <pub-id pub-id-type="doi">10.1145/324133.324140</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref18">
                <label>18</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Brin</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Page</surname>
                            <given-names>L</given-names>
                        </name>
                    </person-group>
                    <article-title>The anatomy of a large-scale hypertextual Web search engine</article-title>
                    <source>Comput Netw ISDN Syst</source>
                    <year>1998</year>
                    <volume>30</volume>
                    <issue>1-7</issue>
                    <fpage>107</fpage>
                    <lpage>17</lpage>
                    <pub-id pub-id-type="doi">10.1016/S0169-7552(98)00110-X</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref19">
                <label>19</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Lempel</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Moran</surname>
                            <given-names>S</given-names>
                        </name>
                    </person-group>
                    <article-title>The stochastic approach for link-structure analysis (SALSA) and the TKC effect</article-title>
                    <source>Comput Netw</source>
                    <year>2000</year>
                    <volume>33</volume>
                    <issue>1-6</issue>
                    <fpage>387</fpage>
                    <lpage>401</lpage>
                    <pub-id pub-id-type="doi">10.1016/S1389-1286(00)00034-7</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref20">
                <label>20</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Gy&#246;ngyi</surname>
                            <given-names>Z</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Garcia-Molina</surname>
                            <given-names>H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Pedersen</surname>
                            <given-names>J</given-names>
                        </name>
                    </person-group>
                    <article-title>Combating web spam with TrustRank</article-title>
                    <source>Proceedings</source>
                    <year>2004</year>
                    <conf-name>Thirtieth International Conference on Very Large Data Bases</conf-name>
                    <conf-date>Aug 31-Sept 3, 2004</conf-date>
                    <conf-loc>Toronto, ON, Canada</conf-loc>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://portal.acm.org/citation.cfm?id=1316689.1316740" />
                    </comment>
                </nlm-citation>
            </ref>
            <ref id="ref21">
                <label>21</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Gou</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Chen</surname>
                            <given-names>HH</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kim</surname>
                            <given-names>JH</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Zhang</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Giles</surname>
                            <given-names>CL</given-names>
                        </name>
                    </person-group>
                    <article-title>SNDocRank: document ranking based on social networks</article-title>
                    <source>Proceedings</source>
                    <year>2010</year>
                    <conf-name>19th International Conference on World Wide Web (WWW '10)</conf-name>
                    <conf-date>Apr 27-30, 2010</conf-date>
                    <conf-loc>Raleigh, NC, USA</conf-loc>
                    <pub-id pub-id-type="doi">10.1145/1772690.1772825</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref22">
                <label>22</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Mislove</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Marcon</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Gummadi</surname>
                            <given-names>KP</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Druschel</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Bhattacharjee</surname>
                            <given-names>B</given-names>
                        </name>
                    </person-group>
                    <article-title>Measurement and analysis of online social networks</article-title>
                    <source>Proceedings</source>
                    <year>2007</year>
                    <conf-name>7th ACM SIGCOMM Conference on Internet Measurement (IMC '07)</conf-name>
                    <conf-date>Oct 24-26, 2007</conf-date>
                    <conf-loc>San Diego, CA, USA</conf-loc>
                    <pub-id pub-id-type="doi">10.1145/1298306.1298311</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref23">
                <label>23</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Gagliardi</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Jadad</surname>
                            <given-names>AR</given-names>
                        </name>
                    </person-group>
                    <article-title>Examination of instruments used to rate quality of health information on the internet: chronicle of a voyage with an unclear destination</article-title>
                    <source>BMJ</source>
                    <year>2002</year>
                    <month>03</month>
                    <day>9</day>
                    <volume>324</volume>
                    <issue>7337</issue>
                    <fpage>569</fpage>
                    <lpage>73</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://bmj.com/cgi/pmidlookup?view=long&#38;pmid=11884320" />
                    </comment>
                    <pub-id pub-id-type="medline">11884320</pub-id>
                    <pub-id pub-id-type="pmcid">PMC78993</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref24">
                <label>24</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Jadad</surname>
                            <given-names>AR</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Gagliardi</surname>
                            <given-names>A</given-names>
                        </name>
                    </person-group>
                    <article-title>Rating health information on the Internet: navigating to knowledge or to Babel?</article-title>
                    <source>JAMA</source>
                    <year>1998</year>
                    <month>02</month>
                    <day>25</day>
                    <volume>279</volume>
                    <issue>8</issue>
                    <fpage>611</fpage>
                    <lpage>4</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://jama.ama-assn.org/cgi/pmidlookup?view=long&#38;pmid=9486757" />
                    </comment>
                    <pub-id pub-id-type="medline">9486757</pub-id>
                    <pub-id pub-id-type="pii">jrv71042</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref25">
                <label>25</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Walji</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sagaram</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sagaram</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Meric-Bernstam</surname>
                            <given-names>F</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Johnson</surname>
                            <given-names>C</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Mirza</surname>
                            <given-names>NQ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Bernstam</surname>
                            <given-names>EV</given-names>
                        </name>
                    </person-group>
                    <article-title>Efficacy of quality criteria to identify potentially harmful information: a cross-sectional survey of complementary and alternative medicine web sites</article-title>
                    <source>J Med Internet Res</source>
                    <year>2004</year>
                    <month>06</month>
                    <day>29</day>
                    <volume>6</volume>
                    <issue>2</issue>
                    <fpage>e21</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2004/2/e21/" />
                    </comment>
                    <pub-id pub-id-type="doi">10.2196/jmir.6.2.e21</pub-id>
                    <pub-id pub-id-type="medline">15249270</pub-id>
                    <pub-id pub-id-type="pii">v6e21</pub-id>
                    <pub-id pub-id-type="pmcid">PMC1550600</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref26">
                <label>26</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <collab>M-Eco Consortium</collab>
                    </person-group>
                    <source>meco-project.eu</source>
                    <year>2010</year>
                    <access-date>2011-11-06</access-date>
                    <comment>M-Eco: Medical EcoSystem<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://meco-project.eu/">http://meco-project.eu/</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">62ztB4MY4</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref27">
                <label>27</label>
                <nlm-citation citation-type="web">
                    <source>Khresmoi</source>
                    <year>2010</year>
                    <access-date>2011-11-06</access-date>
                    <comment>Khresmoi: Medical Information Analysis &#38; Retrieval<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.khresmoi.eu/">http://www.khresmoi.eu/</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">62ztdsCrb</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref28">
                <label>28</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Mayer</surname>
                            <given-names>MA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Karampiperis</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kukurikos</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Karkaletsis</surname>
                            <given-names>V</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Stamatakis</surname>
                            <given-names>K</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Villarroel</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Leis</surname>
                            <given-names>A</given-names>
                        </name>
                    </person-group>
                    <article-title>Applying Semantic Web technologies to improve the retrieval, credibility and use of health-related web resources</article-title>
                    <source>Health Informatics J</source>
                    <year>2011</year>
                    <month>06</month>
                    <volume>17</volume>
                    <issue>2</issue>
                    <fpage>95</fpage>
                    <lpage>115</lpage>
                    <pub-id pub-id-type="doi">10.1177/1460458211405004</pub-id>
                    <pub-id pub-id-type="medline">21712354</pub-id>
                    <pub-id pub-id-type="pii">17/2/95</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref29">
                <label>29</label>
                <nlm-citation citation-type="web">
                    <source>Merriam-Webster Inc</source>
                    <year>2012</year>
                    <access-date>2011-11-06</access-date>
                    <comment>Definition of Trust<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.merriam-webster.com/dictionary/trust">http://www.merriam-webster.com/dictionary/trust</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">62zttQS1q</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref30">
                <label>30</label>
                <nlm-citation citation-type="web">
                    <source>Merriam-Webster Inc</source>
                    <year>2012</year>
                    <access-date>2011-11-06</access-date>
                    <comment>Definition of Authoritative<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.merriam-webster.com/dictionary/authoritative">http://www.merriam-webster.com/dictionary/authoritative</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">62ztwFea0</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref31">
                <label>31</label>
                <nlm-citation citation-type="web">
                    <source>Merriam-Webster Inc</source>
                    <year>2012</year>
                    <access-date>2011-11-06</access-date>
                    <comment>Definition of Reputation<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.merriam-webster.com/dictionary/reputation">http://www.merriam-webster.com/dictionary/reputation</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">62ztyjbVq</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref32">
                <label>32</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Harris</surname>
                            <given-names>PR</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sillence</surname>
                            <given-names>E</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Briggs</surname>
                            <given-names>P</given-names>
                        </name>
                    </person-group>
                    <article-title>Perceived threat and corroboration: key factors that improve a predictive model of trust in internet-based health information and advice</article-title>
                    <source>J Med Internet Res</source>
                    <year>2011</year>
                    <volume>13</volume>
                    <issue>3</issue>
                    <fpage>e51</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2011/3/e51/" />
                    </comment>
                    <pub-id pub-id-type="doi">10.2196/jmir.1821</pub-id>
                    <pub-id pub-id-type="medline">21795237</pub-id>
                    <pub-id pub-id-type="pii">v13i3e51</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3222185</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref33">
                <label>33</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Chin</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Chignell</surname>
                            <given-names>M</given-names>
                        </name>
                    </person-group>
                    <article-title>Automatic detection of cohesive subgroups within social hypertext: a heuristic approach</article-title>
                    <source>N Rev Hypermed Multimed</source>
                    <year>2008</year>
                    <volume>14</volume>
                    <issue>1</issue>
                    <fpage>121</fpage>
                    <lpage>43</lpage>
                    <pub-id pub-id-type="doi">10.1080/13614560802357180</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref34">
                <label>34</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Han</surname>
                            <given-names>YS</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kim</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Cha</surname>
                            <given-names>JW</given-names>
                        </name>
                    </person-group>
                    <article-title>Evaluation of user reputation on YouTube</article-title>
                    <source>Lect Notes Comput Sci</source>
                    <year>2009</year>
                    <volume>5621</volume>
                    <fpage>346</fpage>
                    <lpage>53</lpage>
                    <pub-id pub-id-type="doi">10.1007/978-3-642-02774-1_38</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref35">
                <label>35</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <collab>JUNG Framework Development Team</collab>
                    </person-group>
                    <source>Sourceforge.net</source>
                    <access-date>2011-11-06</access-date>
                    <comment>JUNG: Java Universal Network/Graph Framework<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://jung.sourceforge.net/">http://jung.sourceforge.net/</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">62zwuXUxD</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref36">
                <label>36</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Fernandez-Luque</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Elahi</surname>
                            <given-names>N</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Grajales</surname>
                            <given-names>FJ</given-names>
                        </name>
                    </person-group>
                    <article-title>An analysis of personal medical information disclosed in YouTube videos created by patients with multiple sclerosis</article-title>
                    <source>Stud Health Technol Inform</source>
                    <year>2009</year>
                    <volume>150</volume>
                    <fpage>292</fpage>
                    <lpage>6</lpage>
                    <pub-id pub-id-type="medline">19745316</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref37">
                <label>37</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Fernandez-Luque</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Karlsen</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Melton</surname>
                            <given-names>GB</given-names>
                        </name>
                    </person-group>
                    <article-title>HealthTrust: trust-based retrieval of YouTube's diabetes channels</article-title>
                    <source>Proceedings</source>
                    <year>2011</year>
                    <conf-name>CIKM '11: 20th ACM International Conference on Information and Knowledge Management</conf-name>
                    <conf-date>Oct 24-28, 2011</conf-date>
                    <conf-loc>Glasgow, UK</conf-loc>
                    <pub-id pub-id-type="doi">10.1145/2063576.2063854</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref38">
                <label>38</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Cohen</surname>
                            <given-names>J</given-names>
                        </name>
                    </person-group>
                    <article-title>A coefficient of agreement for nominal scales</article-title>
                    <source>Educ Psychol Meas</source>
                    <year>1960</year>
                    <month>04</month>
                    <volume>20</volume>
                    <issue>1</issue>
                    <fpage>37</fpage>
                    <lpage>46</lpage>
                    <pub-id pub-id-type="doi">10.1177/001316446002000104</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref39">
                <label>39</label>
                <nlm-citation citation-type="web">
                    <source>Comprehensive R Archive Network</source>
                    <year>2012</year>
                    <access-date>2012-01-30</access-date>
                    <comment>Psych: Procedures for Psychological, Psychometric, and Personality Research<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://cran.r-project.org/web/packages/psych/index.html">http://cran.r-project.org/web/packages/psych/index.html</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">655E6HDfK</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref40">
                <label>40</label>
                <nlm-citation citation-type="book">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Buettcher</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Clarke</surname>
                            <given-names>CLA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Cormack</surname>
                            <given-names>G</given-names>
                        </name>
                    </person-group>
                    <source>Information Retrieval: Implementing and Evaluating Search Engines</source>
                    <year>2010</year>
                    <publisher-loc>Cambridge, MA</publisher-loc>
                    <publisher-name>The MIT Press</publisher-name>
                    <fpage>408</fpage>
                </nlm-citation>
            </ref>
            <ref id="ref41">
                <label>41</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>J&#228;rvelin</surname>
                            <given-names>K</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kek&#228;l&#228;inen</surname>
                            <given-names>J</given-names>
                        </name>
                    </person-group>
                    <article-title>Cumulated gain-based evaluation of IR techniques</article-title>
                    <source>ACM Trans Inf Syst</source>
                    <year>2002</year>
                    <volume>20</volume>
                    <issue>4</issue>
                    <fpage>422</fpage>
                    <lpage>46</lpage>
                    <pub-id pub-id-type="doi">10.1145/582415.582418</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref42">
                <label>42</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Rodgers</surname>
                            <given-names>JL</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Nicewander</surname>
                            <given-names>WA</given-names>
                        </name>
                    </person-group>
                    <article-title>Thirteen ways to look at the correlation coefficient</article-title>
                    <source>Am Stat</source>
                    <year>1988</year>
                    <month>02</month>
                    <volume>42</volume>
                    <issue>1</issue>
                    <fpage>59</fpage>
                    <lpage>66</lpage>
                    <pub-id pub-id-type="doi">10.2307/2685263</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref43">
                <label>43</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Davidson</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Liebald</surname>
                            <given-names>B</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Liu</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Nandy</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Van Vleet</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Gargi</surname>
                            <given-names>U</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Gupta</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>He</surname>
                            <given-names>Y</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lambert</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Livingston</surname>
                            <given-names>B</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sampath</surname>
                            <given-names>D</given-names>
                        </name>
                    </person-group>
                    <article-title>The YouTube video recommendation system</article-title>
                    <source>Proceedings</source>
                    <year>2010</year>
                    <conf-name>Fourth ACM Conference on Recommender Systems</conf-name>
                    <conf-date>Sept 26-30, 2010</conf-date>
                    <conf-loc>Barcelona, Spain</conf-loc>
                    <pub-id pub-id-type="doi">10.1145/1864708.1864770</pub-id>
                </nlm-citation>
            </ref>
        </ref-list>
    </back>
</article>
