<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
    <front>
        <journal-meta>
            <journal-id journal-id-type="publisher-id">JMIR</journal-id>
            <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
            <journal-title>Journal of Medical Internet Research</journal-title>
            <issn pub-type="epub">1438-8871</issn>
            <publisher>
                <publisher-name>JMIR Publications Inc.</publisher-name>
                <publisher-loc>Toronto, Canada</publisher-loc>
            </publisher>
        </journal-meta>
        <article-meta>
            <article-id pub-id-type="publisher-id">v16i10e223</article-id>
            <article-id pub-id-type="pmid">25274020</article-id>
            <article-id pub-id-type="doi">10.2196/jmir.3369</article-id>
            <article-categories>
                <subj-group subj-group-type="heading">
                    <subject>Original Paper</subject>
                </subj-group>
                <subj-group subj-group-type="article-type">
                    <subject>Original Paper</subject>
                </subj-group>
            </article-categories>
            <title-group>
                <article-title>Automatic Evidence Retrieval for Systematic Reviews</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="editor">
                    <name>
                        <surname>Eysenbach</surname>
                        <given-names>Gunther</given-names>
                    </name>
                </contrib>
            </contrib-group>
            <contrib-group>
                <contrib contrib-type="reviewer">
                    <name>
                        <surname>Badgett</surname>
                        <given-names>Robert</given-names>
                    </name>
                </contrib>
                <contrib contrib-type="reviewer">
                    <name>
                        <surname>Wallace</surname>
                        <given-names>Byron</given-names>
                    </name>
                </contrib>
            </contrib-group>
            <contrib-group>
                <contrib contrib-type="author" id="contrib1">
                    <name name-style="western">
                        <surname>Choong</surname>
                        <given-names>Miew Keen</given-names>
                    </name>
                    <degrees>PhD</degrees>
                    <xref rid="aff1" ref-type="aff">1</xref>
                    <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-0352-5585</ext-link>
                </contrib>
                <contrib contrib-type="author" id="contrib2">
                    <name name-style="western">
                        <surname>Galgani</surname>
                        <given-names>Filippo</given-names>
                    </name>
                    <degrees>PhD</degrees>
                    <xref rid="aff1" ref-type="aff">1</xref>
                    <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-3553-3611</ext-link>
                </contrib>
                <contrib contrib-type="author" id="contrib3">
                    <name name-style="western">
                        <surname>Dunn</surname>
                        <given-names>Adam G</given-names>
                    </name>
                    <degrees>PhD</degrees>
                    <xref rid="aff1" ref-type="aff">1</xref>
                    <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-1720-8209</ext-link>
                </contrib>
                <contrib contrib-type="author" id="contrib4" corresp="yes">
                    <name name-style="western">
                        <surname>Tsafnat</surname>
                        <given-names>Guy</given-names>
                    </name>
                    <degrees>PhD</degrees>
                    <xref rid="aff1" ref-type="aff">1</xref>
                    <address>
                        <institution>Centre for Health Informatics</institution>
                        <institution>Australian Institute of Health Innovation</institution>
                        <institution>University of New South Wales</institution>
                        <addr-line>AGSM Building, Level 1</addr-line>
                        <addr-line>G27, Gate 11 Botany Street</addr-line>
                        <addr-line>Kensington NSW, 2052</addr-line>
                        <country>Australia</country>
                        <phone>61 293858697</phone>
                        <fax>61 293858692</fax>
                        <email>guyt@unsw.edu.au</email>
                    </address>
                    <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-4353-2026</ext-link>
                </contrib>
            </contrib-group>
            <aff id="aff1">
                <sup>1</sup>
                <institution>Centre for Health Informatics</institution>
                <institution>Australian Institute of Health Innovation</institution>
                <institution>University of New South Wales</institution>
                <addr-line>Kensington NSW</addr-line>
                <country>Australia</country>
            </aff>
            <author-notes>
                <corresp>Corresponding Author: Guy Tsafnat <email>guyt@unsw.edu.au</email>
                </corresp>
            </author-notes>
            <pub-date pub-type="collection">
                <month>10</month>
                <year>2014</year>
            </pub-date>
            <pub-date pub-type="epub">
                <day>01</day>
                <month>10</month>
                <year>2014</year>
            </pub-date>
            <volume>16</volume>
            <issue>10</issue>
            <elocation-id>e223</elocation-id>
            <!--history from ojs - api-xml-->
            <history>
                <date date-type="received">
                    <day>14</day>
                    <month>07</month>
                    <year>2014</year>
                </date>
                <date date-type="rev-request">
                    <day>07</day>
                    <month>08</month>
                    <year>2014</year>
                </date>
                <date date-type="rev-recd">
                    <day>18</day>
                    <month>08</month>
                    <year>2014</year>
                </date>
                <date date-type="accepted">
                    <day>09</day>
                    <month>09</month>
                    <year>2014</year>
                </date>
            </history>
            <!--(c) the authors - correct author names and publication date here if necessary. Date in form ', dd.mm.yyyy' after jmir.org-->
            <copyright-statement>&#169;Miew Keen Choong, Filippo Galgani, Adam G Dunn, Guy Tsafnat. Originally published in the Journal of Medical Internet Research (http://www.jmir.org), 01.10.2014. </copyright-statement>
            <copyright-year>2014</copyright-year>
            <license license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/2.0/">
                <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (http://creativecommons.org/licenses/by/2.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on http://www.jmir.org/, as well as this copyright and license information must be included.</p>
            </license>
            <self-uri xlink:href="http://www.jmir.org/2014/10/e223/" xlink:type="simple" />
            <abstract>
                <sec sec-type="background">
                    <title>Background</title>
                    <p>Snowballing involves recursively pursuing relevant references cited in the retrieved literature and adding them to the search results. Snowballing is an alternative approach to discover additional evidence that was not retrieved through conventional search. Snowballing&#8217;s effectiveness makes it best practice in systematic reviews despite being time-consuming and tedious.</p>
                </sec>
                <sec sec-type="objective">
                    <title>Objective</title>
                    <p>Our goal was to evaluate the capacity of an automatic method for citation snowballing to identify and retrieve the full text and/or abstracts of cited articles.</p>
                </sec>
                <sec sec-type="methods">
                    <title>Methods</title>
                    <p>Using 20 review articles that contained 949 citations to journal or conference articles, we manually searched Microsoft Academic Search (MAS) and identified 78.0% (740/949) of the cited articles that were present in the database. We compared the performance of the automatic citation snowballing method against the results of this manual search, measuring precision, recall, and F<sub>1</sub> score.</p>
                </sec>
                <sec sec-type="results">
                    <title>Results</title>
                    <p>The automatic method was able to correctly identify 633 (as proportion of included citations: recall=66.7%, F<sub>1</sub> score=79.3%; as proportion of citations in MAS: recall=85.5%, F<sub>1</sub> score=91.2%) of citations with high precision (97.7%), and retrieved the full text or abstract for 490 (recall=82.9%, precision=92.1%, F<sub>1</sub> score=87.3%) of the 633 correctly retrieved citations.</p>
                </sec>
                <sec sec-type="conclusions">
                    <title>Conclusions</title>
                    <p>The proposed method for automatic citation snowballing is accurate and is capable of obtaining the full texts or abstracts for a substantial proportion of the scholarly citations in review articles. By automating the process of citation snowballing, it may be possible to reduce the time and effort of common evidence surveillance tasks such as keeping trial registries up to date and conducting systematic reviews.</p>
                </sec>
            </abstract>
            <kwd-group>
                <kwd>evidence-based medicine</kwd>
                <kwd>medical informatics</kwd>
                <kwd>information storage and retrieval</kwd>
            </kwd-group>
        </article-meta>
    </front>
    <body>
        <sec sec-type="introduction">
            <title>Introduction</title>
            <p>Evidence retrieval tasks such as literature reviews and decision support, where recall of all relevant evidence is required, cannot rely on search technology alone due to limitations of keyword searching [<xref ref-type="bibr" rid="ref1">1</xref>]. This has led to the development of secondary search methods such as citation tracking, called snowballing [<xref ref-type="bibr" rid="ref2">2</xref>], and citation pearl growing [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref4">4</xref>].</p>
            <p>Snowballing involves recursively pursuing relevant references cited in already-retrieved literature and adding them to the search results. Thus, snowballing is not limited to citation information found in bibliographical databases. The technical challenges of snowballing include obtaining the full text of retrieved citations, recognizing citation strings in the text, and retrieving new citations from citation strings. These make snowballing both tedious and time consuming.</p>
            <p>Unlike keyword searching, snowballing does not require specific search terms [<xref ref-type="bibr" rid="ref5">5</xref>], which are variable and inconsistent. Rather, it can be thought of as relying on the accumulation of multiple searches from different publishing authors [<xref ref-type="bibr" rid="ref6">6</xref>]. Snowballing is a complementary approach to search for discovering additional evidence. Demonstrably, snowballing improves retrieval&#8212;for example, case studies using search and forward citation tracking on depression and coronary heart disease have been shown to identify more eligible articles than search alone [<xref ref-type="bibr" rid="ref6">6</xref>]. A review on checking reference lists to find additional studies for systematic reviews found that citation tracking increased the yield of search results by 2.5-43% [<xref ref-type="bibr" rid="ref7">7</xref>]. Snowballing is considered best practice and is frequently recommended when conducting systematic reviews [<xref ref-type="bibr" rid="ref2">2</xref>]. With the rapid increase in the rate of publication, automation of snowballing would significantly reduce the time dedicated to literature search.</p>
            <p>We tested an approach to automatic snowballing that uses citation extraction algorithms and scientific search engines to follow the steps of snowballing: (1) extract citation strings from documents, (2) find the citations, (3) fetch the full text of citations, and (4) repeat the process to recursively retrieve more citations. The goal of this study is to test the feasibility of automating each of the subtasks of snowballing.</p>
        </sec>
        <sec sec-type="methods">
            <title>Methods</title>
            <sec>
                <title>Algorithm</title>
                <p>With an initial set of at least one paper, portable document format (PDF) and hypertext markup language (HTML) documents are converted to plain text. A modified version of ParsCit [<xref ref-type="bibr" rid="ref8">8</xref>] (a free and open source reference string segmentation package) identifies reference sections and segments individual reference strings. We modified the heuristics in ParsCit and changed the restriction by allowing the reference label to be found from the middle (50%) to the end of the text. Each reference is converted to a search engine query by removing short words, numbers, and punctuation. The query results returned from the search engine contain citation information (eg, authors, titles, journal, year, digital object identifiers [DOI]) and often one or more links (uniform resource locator [URL]) to full text. We extracted and followed links to the full text. The source code is available in <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref> and [<xref ref-type="bibr" rid="ref9">9</xref>].</p>
            </sec>
            <sec>
                <title>Data</title>
                <p>In the evaluation, we used citations from a set of published English language reviews about neuraminidase inhibitors. The dataset consisted of 152 systematic and non-systematic review articles. We randomly selected a subset of 20 review articles that contained 1057 citations. We excluded references to websites, books, book chapters, newspaper articles, and grey literature, leaving 949 included citations. The properties of the 20 review articles are provided in <xref ref-type="app" rid="app2">Multimedia Appendix 2</xref>.</p>
            </sec>
            <sec>
                <title>Study Design</title>
                <p>We evaluated our algorithm using the proportion of extracted references, the proportion of citations retrieved, and the proportion of abstracts and full texts downloaded. We checked extracted citations manually against the references in the paper. We considered a reference to be correctly extracted only if it contained the entire reference without loss of information. We did allow for minimal extra information, such as white space and citation number, but not information that should have been part of another citation string, page footer, or manuscript text. The accuracy of the retrieved citations and abstracts/full texts was verified manually against the references from the systematic reviews. Correctly retrieved articles were counted as true positives. Retrieved articles that were not the ones cited were counted as false positives.</p>
                <p>We used Microsoft Academic Search (MAS) [<xref ref-type="bibr" rid="ref10">10</xref>] (<xref ref-type="fig" rid="figure1">Figure 1</xref>) in the evaluation. MAS is a generalized scientific literature search engine that covers more than 48 million publications with weekly updates. A free application programming interface (API) is provided for non-commercial purposes after registration. Citations include bibliographic data as well as links to citing papers and links to multiple versions of the paper if more than one version exists, including, often, to full text. We used the MAS API to perform searches for each of the references extracted from the full text of the original paper. Other search engines (eg, Google Scholar [<xref ref-type="bibr" rid="ref11">11</xref>]) can also be used in this step, subject to restrictions they impose. We chose MAS due to its size, &#8220;cited by&#8221; functionality, links to full text, and because it does not enforce active blocking to prevent automated access.</p>
                <p>We manually searched for missed references to ascertain whether they were indeed indexed in MAS. Articles that were not retrieved but were found by manual search of MAS were counted as false negatives. We calculated precision, recall, and F<sub>1</sub> score using the standard formulae:</p>
                <p>Precision = (True positives) / (True positives + False positives)</p>
                <p>Recall = (True positives) / (True positives + False negatives)</p>
                <p>F<sub>1</sub> score = (2 &#215; Precision &#215; Recall) / (Precision + Recall)</p>
                <p>The precision, recall, and F<sub>1</sub> scores were computed for retrieval of citations, abstract (only abstracts or abstracts with full texts), and full text against all citations (1057 references), included citations (949 references), and included citations indexed in MAS (740 references).</p>
                <p>All experiments were conducted on computers with Internet protocols (IP) allocated to the University of New South Wales. Journals that automatically recognize subscription by IP address and to which the University of New South Wales library is subscribed were thus granted access. No other subscription activation or authentication methods were used. However, since most abstracts are freely accessible, download of abstracts will not normally be affected by journal subscription.</p>
                <fig id="figure1" position="float">
                    <label>Figure 1</label>
                    <caption>
                        <p>Microsoft Academic Search (MAS).</p>
                    </caption>
                    <graphic xlink:href="jmir_v16i10e223_fig1.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
            </sec>
        </sec>
        <sec sec-type="results">
            <title>Results</title>
            <p>The summary of the evaluation is shown in <xref ref-type="fig" rid="figure2">Figure 2</xref>. We successfully extracted 97.2% (922/949) of the included citations (96.5%, 1020/1057 of all citations) from the 20 reviews randomly selected. The precision, recall, and F<sub>1</sub> scores for retrieval of citations, abstract (only abstracts or abstracts with full texts), and full text fetching of citations from the 20 randomly selected review articles are shown in <xref ref-type="table" rid="table1">Table 1</xref>. The scores are computed using three categories: (1) all citations, (2) included citations, and (3) included citations indexed in MAS. The first category shows the probability of retrieving a given reference from a review paper. The second category gives the same probability but excludes works not likely to be retrievable such as books and grey literature. The third category excludes citations not currently indexed in MAS.</p>
            <p>For the reference strings indexed in MAS, 66.2% (490/740) of abstracts were correctly downloaded either on their own or as part of the full text. These represent 51.6% of 949 included citations and 46.4% of all 1057 references included in the study.</p>
            <p>Out of the 633 correctly identified citations, we retrieved the full text or abstract for 490 (recall=82.9%, precision=92.1%, F<sub>1</sub> score=87.3%). We examined the specific reasons why 143 (22.6%) of the articles were not downloaded automatically. MAS had incorrect links for 39 articles (6.2%), and no link to full text for 6 articles (0.9%); 56 links (8.8%) led to a page that uses JavaScript to dynamically create a link to the full text. For citations where only abstracts were downloaded (15 abstracts), full text documents were not downloaded due to journal subscription access.</p>
            <table-wrap position="float" id="table1">
                <label>Table 1</label>
                <caption>
                    <p>Results of citations, abstract, and full text retrieval (precision, recall, and F<sub>1</sub> score of database results fetch, and full text and abstract retrieval, comparing all reference strings, only included citations, and only included citations indexed in MAS).</p>
                </caption>
                <table width="800" border="1" cellpadding="7" cellspacing="0" rules="groups" frame="hsides">
                    <col width="89" />
                    <col width="65" />
                    <col width="135" />
                    <col width="154" />
                    <col width="149" />
                    <thead>
                        <tr valign="top">
                            <td colspan="2">
                                <break />
                            </td>
                            <td>As proportion of all citations (n=1057)</td>
                            <td>As proportion of included citations (n=949)</td>
                            <td>As proportion of citations in MAS (n=740)</td>
                        </tr>
                    </thead>
                    <tbody>
                        <tr valign="top">
                            <td colspan="5">
                                <bold>Citations retrieved</bold>
                            </td>
                        </tr>
                        <tr valign="top">
                            <td>
                                <break />
                            </td>
                            <td>Precision</td>
                            <td>0.977</td>
                            <td>0.977</td>
                            <td>0.977</td>
                        </tr>
                        <tr valign="top">
                            <td>
                                <break />
                            </td>
                            <td>Recall</td>
                            <td>0.600</td>
                            <td>0.667</td>
                            <td>0.855</td>
                        </tr>
                        <tr valign="top">
                            <td>
                                <break />
                            </td>
                            <td>F<sub>1</sub> score</td>
                            <td>0.743</td>
                            <td>0.793</td>
                            <td>0.912</td>
                        </tr>
                        <tr valign="top">
                            <td colspan="5">
                                <bold>Abstracts fetched</bold>
                            </td>
                        </tr>
                        <tr valign="top">
                            <td>
                                <break />
                            </td>
                            <td>Precision</td>
                            <td>0.921</td>
                            <td>0.921</td>
                            <td>0.921</td>
                        </tr>
                        <tr valign="top">
                            <td>
                                <break />
                            </td>
                            <td>Recall</td>
                            <td>0.483</td>
                            <td>0.540</td>
                            <td>0.702</td>
                        </tr>
                        <tr valign="top">
                            <td>
                                <break />
                            </td>
                            <td>F<sub>1</sub> score</td>
                            <td>0.634</td>
                            <td>0.681</td>
                            <td>0.797</td>
                        </tr>
                        <tr valign="top">
                            <td colspan="5">
                                <bold>Full text fetched</bold>
                            </td>
                        </tr>
                        <tr valign="top">
                            <td>
                                <break />
                            </td>
                            <td>Precision</td>
                            <td>0.919</td>
                            <td>0.919</td>
                            <td>0.919</td>
                        </tr>
                        <tr valign="top">
                            <td>
                                <break />
                            </td>
                            <td>Recall</td>
                            <td>0.475</td>
                            <td>0.533</td>
                            <td>0.696</td>
                        </tr>
                        <tr valign="top">
                            <td>
                                <break />
                            </td>
                            <td>F<sub>1</sub> score</td>
                            <td>0.626</td>
                            <td>0.674</td>
                            <td>0.792</td>
                        </tr>
                    </tbody>
                </table>
            </table-wrap>
            <fig id="figure2" position="float">
                <label>Figure 2</label>
                <caption>
                    <p>Summary of the evaluation results (from 20 reviews with 949 scholarly citations, MAS included 740 citations, 633 citations were found, and 490 full texts and abstracts were downloaded automatically).</p>
                </caption>
                <graphic xlink:href="jmir_v16i10e223_fig2.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
            </fig>
        </sec>
        <sec sec-type="discussion">
            <title>Discussion</title>
            <sec>
                <title>Principal Findings</title>
                <p>Snowballing is tedious and resource demanding but has been shown to improve retrieval. This evaluation shows that it is feasible to automatically perform snowballing using our method by extracting and downloading the citations. Systems designed to perform many of the systematic review tasks are already in use, in development, or in research [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>]. This study represents a first effort to automate the snowballing tasks in a systematic review process. When integrated with a reliable automatic screening tool, automatic snowballing can have a compound effect and increase recall [<xref ref-type="bibr" rid="ref12">12</xref>].</p>
                <p>Automatic citation extraction is a difficult task [<xref ref-type="bibr" rid="ref14">14</xref>], which makes citation retrieval an even harder task. However, if a unique identifier (eg, DOI or PubMed identifier) were provided for each citation, this would greatly improve the reliability of citation extraction and retrieval.</p>
            </sec>
            <sec>
                <title>Limitations</title>
                <p>A limitation of this study is that full text fetching was tested using only the journal subscriptions of the University of New South Wales library, as recognized by IP address. While this means that results may vary in other institutions, they also represent an exemplar that may guide expectations of results. With the growth of open source and other means of obtaining full text [<xref ref-type="bibr" rid="ref15">15</xref>], the performance of our algorithm may improve.</p>
                <p>In this evaluation, the algorithm was limited to MAS. This is a constraint of the testing system, not of the method. From the limited testing we have conducted, the algorithm performs equivalently on Google Scholar but computer-access restrictions prevented a robust comparison.</p>
                <p>Some existing databases, such as Scopus [<xref ref-type="bibr" rid="ref16">16</xref>] and Web of Science [<xref ref-type="bibr" rid="ref17">17</xref>] (subscription fees apply for both), provide citation analysis and allow one to search both backward (references cited in an investigated text) and forward (papers citing an investigated text) and can thus aid manual snowballing. However, those citations are limited to papers indexed in the respective database. Our method automatically extracts citations directly from documents and can thus cross database boundaries.</p>
            </sec>
            <sec>
                <title>Conclusions</title>
                <p>Snowballing is automatable and can reduce the time and effort of evidence retrieval. It is possible to reliably extract reference lists from the text of scientific papers, find these citations in scientific search engines, and fetch the full text and/or abstract.</p>
            </sec>
        </sec>
    </body>
    <back>
        <app-group>
            <app id="app1">
                <title>Multimedia Appendix 1</title>
                <p>Source code http://www2.chi.unsw.edu.au/~miewkeen/ESuRFr.html.</p>
                <media xlink:href="jmir_v16i10e223_app1.zip" xlink:title="ZIP File (Zip Archive), 1MB" />
            </app>
            <app id="app2">
                <title>Multimedia Appendix 2</title>
                <p>Properties of the 20 review articles included in the study.</p>
                <media xlink:href="jmir_v16i10e223_app2.pdf" xlink:title="PDF File (Adobe PDF File), 3KB" />
            </app>
        </app-group>
        <glossary>
            <title>Abbreviations</title>
            <def-list>
                <def-item>
                    <term id="abb1">API</term>
                    <def>
                        <p>application programming interface</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb2">DOI</term>
                    <def>
                        <p>digital object identifier</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb3">IP</term>
                    <def>
                        <p>Internet protocol</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb4">MAS</term>
                    <def>
                        <p>Microsoft Academic Search</p>
                    </def>
                </def-item>
            </def-list>
        </glossary>
        <ack>
            <p>This work was supported by a National Health &#38; Medical Research Council Centre for Research Excellence in eHealth Grant APP1032664.</p>
        </ack>
        <fn-group>
            <fn fn-type="conflict">
                <p>None declared.</p>
            </fn>
        </fn-group>
        <ref-list>
            <ref id="ref1">
                <label>1</label>
                <nlm-citation citation-type="book">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Ceri</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Bozzon</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Brambilla</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Della Valle</surname>
                            <given-names>E</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Fraternali</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Quarteroni</surname>
                            <given-names>S</given-names>
                        </name>
                    </person-group>
                    <person-group person-group-type="editor">
                        <name name-style="western">
                            <surname>Carey</surname>
                            <given-names>MJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ceri</surname>
                            <given-names>S</given-names>
                        </name>
                    </person-group>
                    <article-title>The information retrieval process</article-title>
                    <source>Web Information Retrieval</source>
                    <year>2013</year>
                    <publisher-loc>Heidelberg</publisher-loc>
                    <publisher-name>Springer</publisher-name>
                    <fpage>13</fpage>
                    <lpage>26</lpage>
                </nlm-citation>
            </ref>
            <ref id="ref2">
                <label>2</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Greenhalgh</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Peacock</surname>
                            <given-names>R</given-names>
                        </name>
                    </person-group>
                    <article-title>Effectiveness and efficiency of search methods in systematic reviews of complex evidence: audit of primary sources</article-title>
                    <source>BMJ</source>
                    <year>2005</year>
                    <month>11</month>
                    <day>5</day>
                    <volume>331</volume>
                    <issue>7524</issue>
                    <fpage>1064</fpage>
                    <lpage>5</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/16230312" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1136/bmj.38636.593461.68</pub-id>
                    <pub-id pub-id-type="medline">16230312</pub-id>
                    <pub-id pub-id-type="pii">bmj.38636.593461.68</pub-id>
                    <pub-id pub-id-type="pmcid">PMC1283190</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref3">
                <label>3</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Ramer</surname>
                            <given-names>SL</given-names>
                        </name>
                    </person-group>
                    <article-title>Site-ation pearl growing: methods and librarianship history and theory</article-title>
                    <source>J Med Libr Assoc</source>
                    <year>2005</year>
                    <month>07</month>
                    <volume>93</volume>
                    <issue>3</issue>
                    <fpage>397</fpage>
                    <lpage>400</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/16059431" />
                    </comment>
                    <pub-id pub-id-type="medline">16059431</pub-id>
                    <pub-id pub-id-type="pmcid">PMC1175807</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref4">
                <label>4</label>
                <nlm-citation citation-type="web">
                    <source>Search Strategies and Heuristics for Searching Bibliographic and Full Text Databases</source>
                    <access-date>2014-08-12</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://dspace.creighton.edu/xmlui/bitstream/handle/10504/5903/Searching%20Databases%20-%20Strategies%20and%20Heuristics.pdf?sequence=1">https://dspace.creighton.edu/xmlui/bitstream/handle/10504/5903/Searching%20Databases%20-%20Strategies%20and%20Heuristics.pdf?sequence=1</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6RlPHoDrK</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref5">
                <label>5</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Robinson</surname>
                            <given-names>KA</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Dunn</surname>
                            <given-names>AG</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Tsafnat</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Glasziou</surname>
                            <given-names>P</given-names>
                        </name>
                    </person-group>
                    <article-title>Citation networks of related trials are often disconnected: implications for bidirectional citation searches</article-title>
                    <source>J Clin Epidemiol</source>
                    <year>2014</year>
                    <month>07</month>
                    <volume>67</volume>
                    <issue>7</issue>
                    <fpage>793</fpage>
                    <lpage>9</lpage>
                    <pub-id pub-id-type="doi">10.1016/j.jclinepi.2013.11.015</pub-id>
                    <pub-id pub-id-type="medline">24725642</pub-id>
                    <pub-id pub-id-type="pii">S0895-4356(14)00026-2</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref6">
                <label>6</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Kuper</surname>
                            <given-names>H</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Nicholson</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hemingway</surname>
                            <given-names>H</given-names>
                        </name>
                    </person-group>
                    <article-title>Searching for observational studies: what does citation tracking add to PubMed? A case study in depression and coronary heart disease</article-title>
                    <source>BMC Med Res Methodol</source>
                    <year>2006</year>
                    <volume>6</volume>
                    <fpage>4</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.biomedcentral.com/1471-2288/6/4" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1186/1471-2288-6-4</pub-id>
                    <pub-id pub-id-type="medline">16483366</pub-id>
                    <pub-id pub-id-type="pii">1471-2288-6-4</pub-id>
                    <pub-id pub-id-type="pmcid">PMC1403794</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref7">
                <label>7</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Horsley</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Dingwall</surname>
                            <given-names>O</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sampson</surname>
                            <given-names>M</given-names>
                        </name>
                    </person-group>
                    <article-title>Checking reference lists to find additional studies for systematic reviews</article-title>
                    <source>Cochrane Database Syst Rev</source>
                    <year>2011</year>
                    <issue>8</issue>
                    <fpage>MR000026</fpage>
                    <pub-id pub-id-type="doi">10.1002/14651858.MR000026.pub2</pub-id>
                    <pub-id pub-id-type="medline">21833989</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref8">
                <label>8</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Councill</surname>
                            <given-names>IG</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Giles</surname>
                            <given-names>CL</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kan</surname>
                            <given-names>MY</given-names>
                        </name>
                    </person-group>
                    <article-title>ParsCit: an open-source CRF reference string parsing package</article-title>
                    <source>Proceedings of the Sixth International Conference on Language Resources and Evaluation</source>
                    <year>2008</year>
                    <conf-name>International Language Resources and Evaluation Conference</conf-name>
                    <conf-date>May 2008</conf-date>
                    <conf-loc>Marrakesh, Morocco</conf-loc>
                </nlm-citation>
            </ref>
            <ref id="ref9">
                <label>9</label>
                <nlm-citation citation-type="web">
                    <source>Evidence Discovery using Microsoft Academic Search (MAS) Sample Code version 0.1</source>
                    <access-date>2014-08-12</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www2.chi.unsw.edu.au/~miewkeen/ESuRFr.html">http://www2.chi.unsw.edu.au/~miewkeen/ESuRFr.html</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6RlLz49RD</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref10">
                <label>10</label>
                <nlm-citation citation-type="web">
                    <source>Microsoft Academic Search</source>
                    <access-date>2014-07-14</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://academic.research.microsoft.com/">http://academic.research.microsoft.com/</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6R35GdAH5</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref11">
                <label>11</label>
                <nlm-citation citation-type="web">
                    <source>Google Scholar</source>
                    <access-date>2014-07-14</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://scholar.google.com.au/">http://scholar.google.com.au/</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6R35D2LI2</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref12">
                <label>12</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Tsafnat</surname>
                            <given-names>G</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Glasziou</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Choong</surname>
                            <given-names>MK</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Dunn</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Galgani</surname>
                            <given-names>F</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Coiera</surname>
                            <given-names>E</given-names>
                        </name>
                    </person-group>
                    <article-title>Systematic review automation technologies</article-title>
                    <source>Syst Rev</source>
                    <year>2014</year>
                    <volume>3</volume>
                    <fpage>74</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.systematicreviewsjournal.com/content/3/1/74" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1186/2046-4053-3-74</pub-id>
                    <pub-id pub-id-type="medline">25005128</pub-id>
                    <pub-id pub-id-type="pii">2046-4053-3-74</pub-id>
                    <pub-id pub-id-type="pmcid">PMC4100748</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref13">
                <label>13</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Wallace</surname>
                            <given-names>BC</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Dahabreh</surname>
                            <given-names>IJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Schmid</surname>
                            <given-names>CH</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lau</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Trikalinos</surname>
                            <given-names>TA</given-names>
                        </name>
                    </person-group>
                    <article-title>Modernizing the systematic review process to inform comparative effectiveness: tools and methods</article-title>
                    <source>J Comp Eff Res</source>
                    <year>2013</year>
                    <month>05</month>
                    <volume>2</volume>
                    <issue>3</issue>
                    <fpage>273</fpage>
                    <lpage>82</lpage>
                    <pub-id pub-id-type="doi">10.2217/cer.13.17</pub-id>
                    <pub-id pub-id-type="medline">24236626</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref14">
                <label>14</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Day</surname>
                            <given-names>MY</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Tsai</surname>
                            <given-names>TH</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sung</surname>
                            <given-names>CL</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lee</surname>
                            <given-names>CW</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Wu</surname>
                            <given-names>SH</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ong</surname>
                            <given-names>CS</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hsu</surname>
                            <given-names>WL</given-names>
                        </name>
                    </person-group>
                    <article-title>A knowledge-based approach to citation extraction</article-title>
                    <year>2005</year>
                    <conf-name>IEEE International Conference on Information Reuse and Integration</conf-name>
                    <conf-date>August 15-17, 2005</conf-date>
                    <conf-loc>Las Vegas, NV</conf-loc>
                    <fpage>50</fpage>
                    <lpage>55</lpage>
                    <pub-id pub-id-type="doi">10.1109/IRI-05.2005.1506448</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref15">
                <label>15</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Dunn</surname>
                            <given-names>AG</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Coiera</surname>
                            <given-names>E</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Mandl</surname>
                            <given-names>KD</given-names>
                        </name>
                    </person-group>
                    <article-title>Is Biblioleaks inevitable?</article-title>
                    <source>J Med Internet Res</source>
                    <year>2014</year>
                    <volume>16</volume>
                    <issue>4</issue>
                    <fpage>e112</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2014/4/e112/" />
                    </comment>
                    <pub-id pub-id-type="doi">10.2196/jmir.3331</pub-id>
                    <pub-id pub-id-type="medline">24755534</pub-id>
                    <pub-id pub-id-type="pii">v16i4e112</pub-id>
                    <pub-id pub-id-type="pmcid">PMC4019771</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref16">
                <label>16</label>
                <nlm-citation citation-type="web">
                    <source>Scopus</source>
                    <access-date>2014-07-14</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.scopus.com/">http://www.scopus.com/</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6R35JZXxj</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref17">
                <label>17</label>
                <nlm-citation citation-type="web">
                    <source>Web of Science</source>
                    <access-date>2014-07-14</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://thomsonreuters.com/thomson-reuters-web-of-science/">http://thomsonreuters.com/thomson-reuters-web-of-science/</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6R35Kw0b4</pub-id>
                </nlm-citation>
            </ref>
        </ref-list>
    </back>
</article>
