<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v22i8e16709</article-id>
      <article-id pub-id-type="pmid">32755895</article-id>
      <article-id pub-id-type="doi">10.2196/16709</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Reproducible Machine Learning Methods for Lung Cancer Detection Using Computed Tomography Images: Algorithm Development and Validation</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Shull</surname>
            <given-names>Jessica</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Morid</surname>
            <given-names>Mohammad</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Yu</surname>
            <given-names>Kun-Hsing</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9892-8218</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Lee</surname>
            <given-names>Tsung-Lu Michael</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4453-3151</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Yen</surname>
            <given-names>Ming-Hsuan</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <xref rid="aff6" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1644-950X</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Kou</surname>
            <given-names>S C</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-1774-3316</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Rosen</surname>
            <given-names>Bruce</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff7" ref-type="aff">7</xref>
          <xref rid="aff8" ref-type="aff">8</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-8576-0839</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Chiang</surname>
            <given-names>Jung-Hsien</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff6" ref-type="aff">6</xref>
          <address>
            <institution>Department of Computer Science and Information Engineering</institution>
            <institution>National Cheng Kung University</institution>
            <addr-line>No 1 University Road</addr-line>
            <addr-line>Tainan</addr-line>
            <country>Taiwan</country>
            <phone>886 6 2757575 ext 62534</phone>
            <email>jchiang@mail.ncku.edu.tw</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-4657-6705</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Kohane</surname>
            <given-names>Isaac S</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff8" ref-type="aff">8</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2192-5160</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Department of Biomedical Informatics</institution>
        <institution>Harvard Medical School</institution>
        <addr-line>Boston, MA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Statistics</institution>
        <institution>Harvard University</institution>
        <addr-line>Cambridge, MA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Department of Pathology</institution>
        <institution>Brigham and Women's Hospital</institution>
        <addr-line>Boston, MA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Department of Information Engineering</institution>
        <institution>Kun Shan University</institution>
        <addr-line>Tainan</addr-line>
        <country>Taiwan</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Graduate Program of Multimedia Systems and Intelligent Computing</institution>
        <institution>National Cheng Kung University and Academia Sinica</institution>
        <addr-line>Tainan</addr-line>
        <country>Taiwan</country>
      </aff>
      <aff id="aff6">
        <label>6</label>
        <institution>Department of Computer Science and Information Engineering</institution>
        <institution>National Cheng Kung University</institution>
        <addr-line>Tainan</addr-line>
        <country>Taiwan</country>
      </aff>
      <aff id="aff7">
        <label>7</label>
        <institution>Department of Radiology, Athinoula A Martinos Center for Biomedical Imaging</institution>
        <institution>Massachusetts General Hospital</institution>
        <addr-line>Boston, MA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff8">
        <label>8</label>
        <institution>Division of Health Sciences and Technology</institution>
        <institution>Harvard–Massachusetts Institute of Technology</institution>
        <addr-line>Boston, MA</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Jung-Hsien Chiang <email>jchiang@mail.ncku.edu.tw</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>8</month>
        <year>2020</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>5</day>
        <month>8</month>
        <year>2020</year>
      </pub-date>
      <volume>22</volume>
      <issue>8</issue>
      <elocation-id>e16709</elocation-id>
      <history>
        <date date-type="received">
          <day>17</day>
          <month>10</month>
          <year>2019</year>
        </date>
        <date date-type="rev-request">
          <day>18</day>
          <month>5</month>
          <year>2020</year>
        </date>
        <date date-type="rev-recd">
          <day>25</day>
          <month>5</month>
          <year>2020</year>
        </date>
        <date date-type="accepted">
          <day>11</day>
          <month>6</month>
          <year>2020</year>
        </date>
      </history>
      <copyright-statement>©Kun-Hsing Yu, Tsung-Lu Michael Lee, Ming-Hsuan Yen, S C Kou, Bruce Rosen, Jung-Hsien Chiang, Isaac S Kohane. Originally published in the Journal of Medical Internet Research (http://www.jmir.org), 05.08.2020.</copyright-statement>
      <copyright-year>2020</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on http://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2020/8/e16709" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Chest computed tomography (CT) is crucial for the detection of lung cancer, and many automated CT evaluation methods have been proposed. Due to the divergent software dependencies of the reported approaches, the developed methods are rarely compared or reproduced.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>The goal of the research was to generate reproducible machine learning modules for lung cancer detection and compare the approaches and performances of the award-winning algorithms developed in the Kaggle Data Science Bowl.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We obtained the source codes of all award-winning solutions of the Kaggle Data Science Bowl Challenge, where participants developed automated CT evaluation methods to detect lung cancer (training set n=1397, public test set n=198, final test set n=506). The performance of the algorithms was evaluated by the log-loss function, and the Spearman correlation coefficient of the performance in the public and final test sets was computed.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Most solutions implemented distinct image preprocessing, segmentation, and classification modules. Variants of U-Net, VGGNet, and residual net were commonly used in nodule segmentation, and transfer learning was used in most of the classification algorithms. Substantial performance variations in the public and final test sets were observed (Spearman correlation coefficient = .39 among the top 10 teams). To ensure the reproducibility of results, we generated a Docker container for each of the top solutions.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>We compared the award-winning algorithms for lung cancer detection and generated reproducible Docker images for the top solutions. Although convolutional neural networks achieved decent accuracy, there is plenty of room for improvement regarding model generalizability.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>computed tomography, spiral</kwd>
        <kwd>lung cancer</kwd>
        <kwd>machine learning</kwd>
        <kwd>early detection of cancer</kwd>
        <kwd>reproducibility of results</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Lung cancer is one of the most prevalent cancers worldwide, causing 1.76 million deaths per year [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. Chest computed tomography (CT) scans play an essential role in the screening for [<xref ref-type="bibr" rid="ref3">3</xref>] and diagnosis of lung cancer [<xref ref-type="bibr" rid="ref4">4</xref>]. A randomized controlled trial demonstrated that low-dose CT screening reduced mortality from lung cancer among high-risk patients [<xref ref-type="bibr" rid="ref3">3</xref>], and recent studies showed the benefit of CT screening in community settings [<xref ref-type="bibr" rid="ref5">5</xref>]. The wide adoption of lung cancer screening is expected to benefit millions of people [<xref ref-type="bibr" rid="ref6">6</xref>]. However, millions of CT scan images obtained from patients constitute a heavy workload for radiologists [<xref ref-type="bibr" rid="ref7">7</xref>]. In addition, interrater disagreement has been documented [<xref ref-type="bibr" rid="ref8">8</xref>]. Previous studies suggested that computer-aided diagnostic systems could improve the detection of pulmonary nodules in CT examination [<xref ref-type="bibr" rid="ref9">9</xref>-<xref ref-type="bibr" rid="ref12">12</xref>]. To stimulate the development of machine learning models for automated CT diagnosis, the Kaggle Data Science Bowl provided labeled chest CT images from 1397 patients and awarded $1 million in prizes to the best algorithms for automated lung cancer diagnosis, which is the largest machine learning challenge on medical imaging to date. In response, 1972 teams worldwide have participated and 394 teams have completed all phases of the competition [<xref ref-type="bibr" rid="ref13">13</xref>], making it the largest health care–related Kaggle contest [<xref ref-type="bibr" rid="ref14">14</xref>]. This provides a unique opportunity to study the robustness of medical machine learning models and compare the performance of various strategies for processing and classifying chest CT images at scale.</p>
      <p>Due to the improved performance of machine learning algorithms for radiology diagnosis, some developers have sought commercialization of their models. However, given the divergent software platforms, packages, and patches employed by different teams, their results were not easily reproducible. The difficulty in reusing the state-of-the-art models and reproducing the diagnostic performance markedly hindered further validation and applications.</p>
      <p>To address this gap, we reimplemented, examined, and systematically compared the algorithms and software codes developed by the best-performing teams of the Kaggle Data Science Bowl. Specifically, we investigated all modules developed by the 10 award-winning teams, including their image preprocessing, segmentation, and classification algorithms. To ensure the reproducibility of results and the reusability of the developed modules, we generated a Docker image for each solution using the Docker Community Edition, a popular open-source software development platform that allows users to create self-contained systems with the desired version of software packages, patches, and environmental settings. According to Docker, there are over 6 million Dockerized applications, with 130 billion total downloads [<xref ref-type="bibr" rid="ref15">15</xref>]. The Docker images are easily transferrable from one server to another, which ensures the reproducibility of scientific computing [<xref ref-type="bibr" rid="ref16">16</xref>]. Our Dockerized modules will facilitate further development of computer-aided diagnostic algorithms for chest CT images and contribute to precision oncology.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Data and Classification Models</title>
        <p>We obtained the low-dose chest CT datasets in Digital Imaging and Communications in Medicine format from the Kaggle Data Science Bowl website [<xref ref-type="bibr" rid="ref13">13</xref>]. The dataset was acquired from patients with high risks for developing lung cancers. In this Kaggle challenge, a training set (n=1397) with ground truth labels (362 with lung cancer; 1035 without) and a public test set (n=198) without labels were provided to the participants. The ground truth label is 1 if the patient developed lung cancer within 1 year of the date the CT scan was performed and 0 otherwise. The diagnosis was confirmed by pathology evaluation as a part of the National Lung Screening Trial [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref17">17</xref>]. Once participants submitted the prediction results for the public test set, the Kaggle competition platform reported their models’ performance on the public leaderboard instantaneously. The final test set (n=506, ground truth labels were not disclosed to participants) was only available to participants after the model submission deadline, thus serving as an independent validation set that decided the final winners. The chest CT images in the training set, public test set, and final test set all came from multiple hospitals and had different qualities. In particular, the final test set contained more recent and higher quality data with thinner slice thickness than those in the two other sets [<xref ref-type="bibr" rid="ref18">18</xref>].</p>
        <p>To systematically compare the solutions developed by the award-winning teams, we acquired the source codes of the winning solutions and their documentation from the Kaggle news release after the conclusion of the competition. Per the rules of this Kaggle challenge, the source codes of these award-winning solutions were required to be released under open-source licenses approved by the Open Source Initiative [<xref ref-type="bibr" rid="ref19">19</xref>] in order to facilitate free distribution and derivation of the solution codes [<xref ref-type="bibr" rid="ref20">20</xref>]. The default license is the MIT license [<xref ref-type="bibr" rid="ref20">20</xref>]. Under the open-source licenses approved by Open Source Initiative, the software can be freely used, modified, and shared [<xref ref-type="bibr" rid="ref19">19</xref>].</p>
      </sec>
      <sec>
        <title>Comparison of the Approaches and Their Performance</title>
        <p>We compared the workflows of the top 10 solutions by examining and rerunning their source codes. For each solution, we inspected all steps taken from inputting the CT images to outputting the prediction. We documented the versions of the software package and platform dependencies of each solution.</p>
        <p>The Kaggle Data Science Bowl used the log-loss function to evaluate the performance of the models [<xref ref-type="bibr" rid="ref13">13</xref>]. The log-loss function <graphic xlink:href="jmir_v22i8e16709_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/> where n is the number of patients in the test set, <italic>y<sub>i</sub></italic> is 1 if patient i has lung cancer, 0 otherwise, and <italic>ŷ<sub>i</sub></italic> is the predicted probability that patient i has lung cancer [<xref ref-type="bibr" rid="ref13">13</xref>]. If the predicted outcome is set as 0.5 for all patients, the log-loss value would be ln (2) ≈ 0.69.</p>
        <p>To investigate whether models with high performance in the public test set generalize to the images in the final test set, we computed the Spearman correlation coefficient of the log-loss in the two test sets. All analyses were conducted using R version 3.6 (R Foundation for Statistical Computing).</p>
      </sec>
      <sec>
        <title>Docker Image Generation for the Top Ten Solutions</title>
        <p>We reproduced the results by recompiling the source codes and dependencies of each of the top ten solutions. Since the solutions used various platforms and different versions of custom software packages, many of which were not compatible with the most updated packages or mainstream release, we generated Docker images [<xref ref-type="bibr" rid="ref16">16</xref>] to manage the software dependencies and patches required by each solution to enhance the reusability and reproducibility of the developed algorithms.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Performance Comparison</title>
        <p><xref rid="figure1" ref-type="fig">Figure 1</xref> summarizes the public and private test set scores of the top 250 teams that participated in the Kaggle Data Science Bowl. Results showed that the top 20 teams achieved a log-loss less than 0.5 in the final test set, and more than 80 submissions reached a log-loss less than 0.6 in the same set. However, these models had varying performances in the public test set. Surprisingly, 11 out of the top 50 teams had a public test set log-loss greater than 0.69, which was worse than blindly submitting “0.5” as the cancer probability for every patient. The correlation between the public test set scores and the final test set scores was weak among all teams that completed the contest (Spearman correlation coefficient = .23; <xref rid="figure2" ref-type="fig">Figure 2</xref>A). In the top 10 teams, the correlation is moderate (Spearman correlation coefficient = .39; <xref rid="figure2" ref-type="fig">Figure 2</xref>B).</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>The log-loss score distribution of the top 250 teams in the Kaggle Data Science Bowl Competition. The log-loss scores of the public test set and the final test set of each team were plotted. The red horizontal line indicates the log-loss of outputting the cancer probability as 0.5 for each patient. The blue horizontal line shows the log-loss of outputting cancer probability of each patient as the prevalence of cancer (0.26) in the training set.</p>
          </caption>
          <graphic xlink:href="jmir_v22i8e16709_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>A weak to moderate correlation between the log-loss scores of the public test set and the scores of the final test set. The red regression line shows the relation between the log-loss scores of the public test set and those of the final test set using a linear regression model. (A) The log-transformed scores of all participants who finished both stages of the Kaggle Data Science Bowl Competition were plotted. The Spearman correlation coefficient of the performance in the two test sets is .23. (B) The log-transformed scores of the top 10 teams defined by the final test set performance. The Spearman correlation coefficient among the top 10 teams is .39.</p>
          </caption>
          <graphic xlink:href="jmir_v22i8e16709_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Data Workflow Comparison</title>
        <p><xref rid="figure3" ref-type="fig">Figure 3</xref> summarizes the most frequently used strategy by the winning teams. Most solutions used additional publicly available datasets, generated lung segmentation, rescaled the voxels, and performed nodule segmentations before fitting the classification models. <xref ref-type="table" rid="table1">Table 1</xref> compares the additional datasets, data preprocessing, segmentation, classification, implementation, and final test set scores of the top 10 solutions.</p>
        <p>In addition to the training dataset provided by the Kaggle challenge, most teams used CT images and nodule annotations from other publicly available resources. <xref ref-type="table" rid="table2">Table 2</xref> summarizes the sample size, availability of nodule locations, nodule segmentation, diagnoses, other characteristics of the Kaggle dataset, and additional datasets employed by the participants. Most of the top solutions used images and nodule segmentations from the Lung Nodule Analysis 2016 (LUNA16) challenge to develop their segmentation algorithms. LUNA16 is a closely related competition organized in 2016 with an aim to detect lung nodules in chest CT images [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref22">22</xref>]. Two teams also reported using the lung CT images, diagnostic annotations, and nodule location data from the International Society for Optics and Photonics (SPIE)–American Association of Physicists in Medicine (AAPM) Lung CT Challenge [<xref ref-type="bibr" rid="ref23">23</xref>], but one of them did not incorporate this relatively small dataset (n=70) when building the final models. Only one of the top 10 teams did not use any additional datasets outside of the competition.</p>
        <p>Frequently used image preprocessing steps include lung segmentation and voxel scaling. Voxel scaling ensures that the voxels of images from various CT scan protocols correspond to similar sizes of physical space. Variants of U-Net [<xref ref-type="bibr" rid="ref24">24</xref>], VGGNet [<xref ref-type="bibr" rid="ref25">25</xref>], and residual net (ResNet) [<xref ref-type="bibr" rid="ref26">26</xref>] were commonly used as the nodule segmentation algorithms, and the nodule segmentation models trained on the LUNA16 dataset were often applied to the Data Science Bowl dataset.</p>
        <p>After lung nodule segmentation, classification algorithms were employed to generate final cancer versus noncancer predictions. Most of the solutions leveraged existing ImageNet-based architecture and transfer learning [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref27">27</xref>]. All teams employed 2D or 3D convolutional neural networks (CNN). A few teams employed CNNs as feature extractors and used tree-based classifiers for this classification task.</p>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>A model of the informatics workflow used by most teams. In addition to the Kaggle training set, most teams obtained additional publicly available datasets with annotations. Lung segmentation, image rescaling, and nodule segmentation modules were commonly used before classification.</p>
          </caption>
          <graphic xlink:href="jmir_v22i8e16709_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Comparisons of the top-performing solutions of the Kaggle Data Science Bowl.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="60"/>
            <col width="120"/>
            <col width="120"/>
            <col width="200"/>
            <col width="130"/>
            <col width="180"/>
            <col width="90"/>
            <col width="100"/>
            <thead>
              <tr valign="top">
                <td>Rank</td>
                <td>Team name</td>
                <td>Additional datasets used</td>
                <td>Data preprocessing</td>
                <td>Nodule segmentation</td>
                <td>Classification algorithms</td>
                <td>Implementation</td>
                <td>Final test set score</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>1</td>
                <td>Grt123</td>
                <td>LUNA16<sup>a</sup></td>
                <td>Lung segmentation, intensity normalization</td>
                <td>Variant of U-Net</td>
                <td>Neural network with a max-pooling layer and two fully connected layers</td>
                <td>Pytorch</td>
                <td>0.39975</td>
              </tr>
              <tr valign="top">
                <td>2</td>
                <td>Julian de Wit and Daniel Hammack</td>
                <td>LUNA16, LIDC<sup>b</sup></td>
                <td>Rescale to 1×1×1</td>
                <td>C3D<sup>c</sup>, ResNet-like CNN<sup>d</sup></td>
                <td>C3D, ResNet-like CNN</td>
                <td>Keras, Tensorflow, Theano</td>
                <td>0.40117</td>
              </tr>
              <tr valign="top">
                <td>3</td>
                <td>Aidence</td>
                <td>LUNA16</td>
                <td>Rescale to 2.5×0.512×0.512 (for nodule detection) and 1.25×0.5×0.5 (for classification)</td>
                <td>ResNet<sup>e</sup></td>
                <td>3D DenseNet<sup>f</sup> multitask model (different loss functions depending on the input source)</td>
                <td>Tensorflow</td>
                <td>0.40127</td>
              </tr>
              <tr valign="top">
                <td>4</td>
                <td>qfpxfd</td>
                <td>LUNA16, SPIE-AAPM<sup>g</sup></td>
                <td>Lung segmentation</td>
                <td>Faster R-CNN<sup>h</sup>, with 3D CNN for false positive reduction</td>
                <td>3D CNN inspired by VGGNet</td>
                <td>Keras, Tensorflow, Caffe</td>
                <td>0.40183</td>
              </tr>
              <tr valign="top">
                <td>5</td>
                <td>Pierre Fillard (Therapixel)</td>
                <td>LUNA16</td>
                <td>Rescale to 0.625×0.625×0.625, lung segmentation</td>
                <td>3D CNN inspired by VGGNet</td>
                <td>3D CNN inspired by VGGNet</td>
                <td>Tensorflow</td>
                <td>0.40409</td>
              </tr>
              <tr valign="top">
                <td>6</td>
                <td>MDai</td>
                <td>None</td>
                <td>Rescale to 1×1×1, normalize HU<sup>i</sup></td>
                <td>2D and 3D ResNet</td>
                <td>3D ResNet + a Xgboost classifier incorporating CNN output, patient sex, # nodules, and other nodule features</td>
                <td>Keras, Tensorflow, Xgboost</td>
                <td>0.41629</td>
              </tr>
              <tr valign="top">
                <td>7</td>
                <td>DL Munich</td>
                <td>LUNA16</td>
                <td>Rescale to 1×1×1, lung segmentation</td>
                <td>U-Net</td>
                <td>2D and 3D residual neural network</td>
                <td>Tensorflow</td>
                <td>0.42751</td>
              </tr>
              <tr valign="top">
                <td>8</td>
                <td>Alex, Andre, Gilberto, and Shize</td>
                <td>LUNA16</td>
                <td>Rescale to 2×2×2</td>
                <td>Variant of U-Net</td>
                <td>CNN, tree-based classifiers (with better performance)</td>
                <td>Keras, Theano, xgboost, extraTree</td>
                <td>0.43019</td>
              </tr>
              <tr valign="top">
                <td>9</td>
                <td>Deep Breath</td>
                <td>LUNA16, SPIE-AAPM<sup>j</sup></td>
                <td>Lung mask</td>
                <td>Variant of SegNet</td>
                <td>Inception-ResNet v2</td>
                <td>Theano and Lasagne</td>
                <td>0.43872</td>
              </tr>
              <tr valign="top">
                <td>10</td>
                <td>Owkin Team</td>
                <td>LUNA16</td>
                <td>Lung segmentation</td>
                <td>U-Net, 3D VGGNet</td>
                <td>Gradient boosting</td>
                <td>Keras, Tensorflow, xgboost</td>
                <td>0.44068</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>LUNA16: Lung Nodule Analysis 2016.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>LIDC: Lung Image Database Consortium.</p>
            </fn>
            <fn id="table1fn3">
              <p><sup>c</sup>C3D: convolutional 3D.</p>
            </fn>
            <fn id="table1fn4">
              <p><sup>d</sup>ResNet-like CNN: residual net–like convolutional neural network.</p>
            </fn>
            <fn id="table1fn5">
              <p><sup>e</sup>ResNet: residual net.</p>
            </fn>
            <fn id="table1fn6">
              <p><sup>f</sup>DenseNet: dense convolutional network.</p>
            </fn>
            <fn id="table1fn7">
              <p><sup>g</sup>SPIE-AAPM: International Society for Optics and Photonics–American Association of Physicists in Medicine Lung CT Challenge.</p>
            </fn>
            <fn id="table1fn8">
              <p><sup>h</sup>R-CNN: region-based convolutional neural networks.</p>
            </fn>
            <fn id="table1fn9">
              <p><sup>i</sup>HU: Hounsfield unit.</p>
            </fn>
            <fn id="table1fn10">
              <p><sup>j</sup>Dataset has been evaluated but not used in building the final model.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>A summary of the chest computed tomography datasets employed by the participants.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="290"/>
            <col width="160"/>
            <col width="140"/>
            <col width="120"/>
            <col width="120"/>
            <col width="170"/>
            <thead>
              <tr valign="top">
                <td>Datasets</td>
                <td>Number of CT<sup>a</sup> scan series</td>
                <td>Data originated from multiple sites</td>
                <td>Availability of nodule locations</td>
                <td>Availability of nodule segmentations</td>
                <td>Availability of patients’ diagnoses (benign versus malignant)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Kaggle Data Science Bowl (this competition)</td>
                <td>Training: 1397; public test set: 198; final test set: 506</td>
                <td>Yes</td>
                <td>No</td>
                <td>No</td>
                <td>Yes</td>
              </tr>
              <tr valign="top">
                <td>Lung nodule analysis</td>
                <td>888</td>
                <td>Yes</td>
                <td>Yes</td>
                <td>Yes</td>
                <td>Yes</td>
              </tr>
              <tr valign="top">
                <td>SPIE-AAPM<sup>b</sup> Lung CT Challenge</td>
                <td>70</td>
                <td>No</td>
                <td>Yes</td>
                <td>No</td>
                <td>Yes</td>
              </tr>
              <tr valign="top">
                <td>Lung Image Database Consortium</td>
                <td>1398</td>
                <td>Yes</td>
                <td>Yes</td>
                <td>Yes</td>
                <td>Yes</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>CT: computed tomography.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>SPIE-AAPM: International Society for Optics and Photonics–American Association of Physicists in Medicine.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Comparison of the Implementation Platforms and Software Dependencies</title>
        <p>Most of the winning teams developed their modules with Keras and Tensorflow. Only one team used Pytorch (the top-performing team), Caffe, or Lasagne. All of the top 10 teams employed a number of python packages for scientific computing and image processing, including NumPy, SciPy, and Scikit-image (skimage). A summary of package dependencies is shown in <xref rid="figure4" ref-type="fig">Figure 4</xref>. This reflected the popularity of the tools for processing chest CT images, building neural networks, and scientific computing among the top contestants of this contest.</p>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>The most widely used dependencies by the top 10 teams. The packages are ordered by their prevalence among the top teams. For simplicity, dependencies used by only one team are omitted from the figure.</p>
          </caption>
          <graphic xlink:href="jmir_v22i8e16709_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Docker Images of the Top Solutions</title>
        <p>To facilitate reusing the code developed by the top teams, we generated a Docker image for each of the available solutions. Our developed Docker images are redistributed under the open-source licenses chosen by the original developers [<xref ref-type="bibr" rid="ref28">28</xref>]. Detailed instructions on accessing the Docker images can be found on GitHub [<xref ref-type="bibr" rid="ref29">29</xref>].</p>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>This is the first study that systematically compared the algorithms and implementations of award-winning pulmonary nodule classifiers. Results showed that the majority of the best-performing solutions used additional datasets to train the pulmonary nodule segmentation models. The top solutions used different data preprocessing, segmentation, and classification algorithms. Nonetheless, they only differ slightly in their final test set scores.</p>
        <p>The most commonly used data preprocessing steps were lung segmentation and voxel scaling [<xref ref-type="bibr" rid="ref30">30</xref>]. For nodule classification, many solutions used CNNs. However, 2 of the top 10 teams employed tree-based methods for cancer versus noncancer classification. Tree-based approaches require a predefined set of image features, whereas CNNs allow data to refine the definition of features [<xref ref-type="bibr" rid="ref31">31</xref>]. Given sufficient sample size, CNNs outperformed tree-based methods in many image-related tasks [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref32">32</xref>], whereas tree-based methods could reach satisfactory performance when the sample size was small, and they provided better model interpretability [<xref ref-type="bibr" rid="ref33">33</xref>-<xref ref-type="bibr" rid="ref35">35</xref>]. Since the conclusion of the contest, additional works on machine learning for CT evaluation have been published [<xref ref-type="bibr" rid="ref36">36</xref>-<xref ref-type="bibr" rid="ref40">40</xref>]. Nonetheless, these works reported similar strategies for data processing and classification overall.</p>
        <p>To enhance the reproducibility of the developed modules, we generated a Docker image for each of the award-winning solutions. The Docker images contain all software dependencies and patches required by the source codes and are portable to various computing environments [<xref ref-type="bibr" rid="ref16">16</xref>], which will expedite the application and improvement of the state-of-the-art CT analytical modules implemented by the contest winners.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>Since it was difficult to compile and release a large deidentified chest CT dataset to the public, the public test set only contains images from 198 patients. Leveraging the 5-digit precision of the log-loss value shown on the leaderboard, one participant implemented and shared a method for identifying all ground truth labels in the public test set during the competition [<xref ref-type="bibr" rid="ref41">41</xref>]. Several participants successfully replicated this approach and got perfect scores on the public leaderboard. Thus, solutions with very low log-loss in the public test set may result from information leakage. Interestingly, among the top-10 models defined by the final test set, 2 performed worse than random guessing in the public test set, which raised concerns on their generalizability [<xref ref-type="bibr" rid="ref42">42</xref>].</p>
        <p>There are several approaches future contest organizers can take to ensure the generalizability of the developed models. First, a multistage competition can filter out the overfitted models using the first private test set and only allow reasonable models to advance to the final evaluation. In addition, organizers can discourage leaderboard probing by only showing the performance of a random subset of the public test data or limiting the number of submissions allowed per day. Finally, curating a larger test set can better evaluate the true model performance and reduce random variability [<xref ref-type="bibr" rid="ref43">43</xref>]. If data deidentification is difficult, requiring contestants to submit their models to a secure computing environment rather than distributing the test data to the participants can minimize the risk of leaking identifiable medical information.</p>
      </sec>
      <sec>
        <title>Conclusion</title>
        <p>In summary, we compared, reproduced, and Dockerized state-of-the-art pulmonary nodule segmentation and classification modules. Results showed that many transfer learning approaches achieved reasonable accuracy in diagnosing chest CT images. Future works on additional data collections and validation will further enhance the generalizability of the current methods.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AAPM</term>
          <def>
            <p>American Association of Physicists in Medicine</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">CNN</term>
          <def>
            <p>convolutional neural network</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">CT</term>
          <def>
            <p>computed tomography</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">LUNA16</term>
          <def>
            <p>Lung Nodule Analysis 2016</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">ResNet</term>
          <def>
            <p>residual net</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">skimage</term>
          <def>
            <p>Scikit-image</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">SPIE</term>
          <def>
            <p>International Society for Optics and Photonics</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>The authors express their appreciation to Dr Steven Seltzer for his feedback on the manuscript; Drs Shann-Ching Chen, Albert Tsung-Ying Ho, and Luke Kung for identifying the data resources; Dr Mu-Hung Tsai for pointing out the computing resources; and Ms Samantha Lemos and Nichole Parker for their administrative support. K-HY is a Harvard Data Science Fellow. This work was supported in part by the Blavatnik Center for Computational Biomedicine Award and grants from the Office of the Director, National Institutes of Health (grant number OT3OD025466), and the Ministry of Science and Technology Research Grant, Taiwan (grant numbers MOST 103-2221-E-006-254-MY2 and MOST 103-2221-E-168-019). The authors thank the Amazon Web Services Cloud Credits for Research, Microsoft Azure Research Award, and the NVIDIA Corporation for their support on the computational infrastructure. This work used the Extreme Science and Engineering Discovery Environment Bridges Pylon at the Pittsburgh Supercomputing Center (through allocation TG-BCS180016), which is supported by the National Science Foundation (grant number ACI-1548562).</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Torre</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Bray</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Siegel</surname>
              <given-names>RL</given-names>
            </name>
            <name name-style="western">
              <surname>Ferlay</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lortet-Tieulent</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jemal</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Global cancer statistics 2012</article-title>
          <source>CA Cancer J Clin</source>
          <year>2015</year>
          <month>03</month>
          <volume>65</volume>
          <issue>2</issue>
          <fpage>87</fpage>
          <lpage>108</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.doi.org/10.3322/caac.21262"/>
          </comment>
          <pub-id pub-id-type="doi">10.3322/caac.21262</pub-id>
          <pub-id pub-id-type="medline">25651787</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bray</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Ferlay</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Soerjomataram</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Siegel</surname>
              <given-names>RL</given-names>
            </name>
            <name name-style="western">
              <surname>Torre</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Jemal</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Global cancer statistics 2018: GLOBOCAN estimates of incidence and mortality worldwide for 36 cancers in 185 countries</article-title>
          <source>CA Cancer J Clin</source>
          <year>2018</year>
          <month>09</month>
          <day>12</day>
          <volume>68</volume>
          <issue>6</issue>
          <fpage>394</fpage>
          <lpage>424</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.3322/caac.21492"/>
          </comment>
          <pub-id pub-id-type="doi">10.3322/caac.21492</pub-id>
          <pub-id pub-id-type="medline">30207593</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Aberle</surname>
              <given-names>DR</given-names>
            </name>
            <name name-style="western">
              <surname>Adams</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Berg</surname>
              <given-names>CD</given-names>
            </name>
            <name name-style="western">
              <surname>Black</surname>
              <given-names>WC</given-names>
            </name>
            <name name-style="western">
              <surname>Clapp</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Fagerstrom</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Gareen</surname>
              <given-names>IF</given-names>
            </name>
            <name name-style="western">
              <surname>Gatsonis</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Marcus</surname>
              <given-names>PM</given-names>
            </name>
            <name name-style="western">
              <surname>Sicks</surname>
              <given-names>JD</given-names>
            </name>
          </person-group>
          <article-title>Reduced lung-cancer mortality with low-dose computed tomographic screening</article-title>
          <source>N Engl J Med</source>
          <year>2011</year>
          <month>08</month>
          <day>4</day>
          <volume>365</volume>
          <issue>5</issue>
          <fpage>395</fpage>
          <lpage>409</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21714641"/>
          </comment>
          <pub-id pub-id-type="doi">10.1056/NEJMoa1102873</pub-id>
          <pub-id pub-id-type="medline">21714641</pub-id>
          <pub-id pub-id-type="pmcid">PMC4356534</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gould</surname>
              <given-names>MK</given-names>
            </name>
            <name name-style="western">
              <surname>Donington</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lynch</surname>
              <given-names>WR</given-names>
            </name>
            <name name-style="western">
              <surname>Mazzone</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Midthun</surname>
              <given-names>DE</given-names>
            </name>
            <name name-style="western">
              <surname>Naidich</surname>
              <given-names>DP</given-names>
            </name>
            <name name-style="western">
              <surname>Wiener</surname>
              <given-names>RS</given-names>
            </name>
          </person-group>
          <article-title>Evaluation of individuals with pulmonary nodules: when is it lung cancer? Diagnosis and management of lung cancer, 3rd ed: American College of Chest Physicians evidence-based clinical practice guidelines</article-title>
          <source>Chest</source>
          <year>2013</year>
          <month>05</month>
          <volume>143</volume>
          <issue>5 Suppl</issue>
          <fpage>e93S</fpage>
          <lpage>e120S</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/23649456"/>
          </comment>
          <pub-id pub-id-type="doi">10.1378/chest.12-2351</pub-id>
          <pub-id pub-id-type="medline">23649456</pub-id>
          <pub-id pub-id-type="pii">S0012-3692(13)60291-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC3749714</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lam</surname>
              <given-names>VK</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dowling</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Singhal</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Young</surname>
              <given-names>RP</given-names>
            </name>
            <name name-style="western">
              <surname>Cabebe</surname>
              <given-names>EC</given-names>
            </name>
          </person-group>
          <article-title>Community low-dose CT lung cancer screening: a prospective cohort study</article-title>
          <source>Lung</source>
          <year>2015</year>
          <month>02</month>
          <volume>193</volume>
          <issue>1</issue>
          <fpage>135</fpage>
          <lpage>139</lpage>
          <pub-id pub-id-type="doi">10.1007/s00408-014-9671-9</pub-id>
          <pub-id pub-id-type="medline">25503535</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Moyer</surname>
              <given-names>VA</given-names>
            </name>
            <collab>U.S. Preventive Services Task Forsce</collab>
          </person-group>
          <article-title>Screening for lung cancer: U.S. Preventive Services Task Force recommendation statement</article-title>
          <source>Ann Intern Med</source>
          <year>2014</year>
          <month>03</month>
          <day>4</day>
          <volume>160</volume>
          <issue>5</issue>
          <fpage>330</fpage>
          <lpage>338</lpage>
          <pub-id pub-id-type="doi">10.7326/M13-2771</pub-id>
          <pub-id pub-id-type="medline">24378917</pub-id>
          <pub-id pub-id-type="pii">1809422</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gurcan</surname>
              <given-names>MN</given-names>
            </name>
            <name name-style="western">
              <surname>Sahiner</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Petrick</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Chan</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kazerooni</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Cascade</surname>
              <given-names>PN</given-names>
            </name>
            <name name-style="western">
              <surname>Hadjiiski</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Lung nodule detection on thoracic computed tomography images: preliminary evaluation of a computer-aided diagnosis system</article-title>
          <source>Med Phys</source>
          <year>2002</year>
          <month>11</month>
          <volume>29</volume>
          <issue>11</issue>
          <fpage>2552</fpage>
          <lpage>2558</lpage>
          <pub-id pub-id-type="doi">10.1118/1.1515762</pub-id>
          <pub-id pub-id-type="medline">12462722</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>SP</given-names>
            </name>
            <name name-style="western">
              <surname>Gierada</surname>
              <given-names>DS</given-names>
            </name>
            <name name-style="western">
              <surname>Pinsky</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Sanders</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Fineberg</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Lynch</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Nath</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Reader variability in identifying pulmonary nodules on chest radiographs from the national lung screening trial</article-title>
          <source>J Thorac Imaging</source>
          <year>2012</year>
          <month>07</month>
          <volume>27</volume>
          <issue>4</issue>
          <fpage>249</fpage>
          <lpage>254</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/22627615"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/RTI.0b013e318256951e</pub-id>
          <pub-id pub-id-type="medline">22627615</pub-id>
          <pub-id pub-id-type="pmcid">PMC3409316</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Doi</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Computer-aided diagnosis in medical imaging: historical review, current status and future potential</article-title>
          <source>Comput Med Imaging Graph</source>
          <year>2007</year>
          <volume>31</volume>
          <issue>4-5</issue>
          <fpage>198</fpage>
          <lpage>211</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/17349778"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.compmedimag.2007.02.002</pub-id>
          <pub-id pub-id-type="medline">17349778</pub-id>
          <pub-id pub-id-type="pii">S0895-6111(07)00026-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC1955762</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rubin</surname>
              <given-names>GD</given-names>
            </name>
            <name name-style="western">
              <surname>Lyo</surname>
              <given-names>JK</given-names>
            </name>
            <name name-style="western">
              <surname>Paik</surname>
              <given-names>DS</given-names>
            </name>
            <name name-style="western">
              <surname>Sherbondy</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Chow</surname>
              <given-names>LC</given-names>
            </name>
            <name name-style="western">
              <surname>Leung</surname>
              <given-names>AN</given-names>
            </name>
            <name name-style="western">
              <surname>Mindelzun</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Schraedley-Desmond</surname>
              <given-names>PK</given-names>
            </name>
            <name name-style="western">
              <surname>Zinck</surname>
              <given-names>SE</given-names>
            </name>
            <name name-style="western">
              <surname>Naidich</surname>
              <given-names>DP</given-names>
            </name>
            <name name-style="western">
              <surname>Napel</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Pulmonary nodules on multi-detector row CT scans: performance comparison of radiologists and computer-aided detection</article-title>
          <source>Radiology</source>
          <year>2005</year>
          <month>01</month>
          <volume>234</volume>
          <issue>1</issue>
          <fpage>274</fpage>
          <lpage>283</lpage>
          <pub-id pub-id-type="doi">10.1148/radiol.2341040589</pub-id>
          <pub-id pub-id-type="medline">15537839</pub-id>
          <pub-id pub-id-type="pii">2341040589</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Awai</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Murao</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Ozawa</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Komi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hayakawa</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Hori</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Nishimura</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Pulmonary nodules at chest CT: effect of computer-aided diagnosis on radiologists' detection performance</article-title>
          <source>Radiology</source>
          <year>2004</year>
          <month>02</month>
          <volume>230</volume>
          <issue>2</issue>
          <fpage>347</fpage>
          <lpage>352</lpage>
          <pub-id pub-id-type="doi">10.1148/radiol.2302030049</pub-id>
          <pub-id pub-id-type="medline">14752180</pub-id>
          <pub-id pub-id-type="pii">230/2/347</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Beam</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Kohane</surname>
              <given-names>IS</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence in healthcare</article-title>
          <source>Nat Biomed Eng</source>
          <year>2018</year>
          <month>10</month>
          <volume>2</volume>
          <issue>10</issue>
          <fpage>719</fpage>
          <lpage>731</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41551-018-0305-z"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41551-018-0305-z</pub-id>
          <pub-id pub-id-type="medline">31015651</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41551-018-0305-z</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="web">
          <article-title>Data Science Bowl 2017</article-title>
          <source>Kaggle Inc</source>
          <access-date>2020-07-12</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.kaggle.com/c/data-science-bowl-2017">https://www.kaggle.com/c/data-science-bowl-2017</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="web">
          <article-title>Healthcare 2020</article-title>
          <source>Kaggle Inc</source>
          <access-date>2020-07-12</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.kaggle.com/tags/healthcare">https://www.kaggle.com/tags/healthcare</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="web">
          <source>About Docker</source>
          <access-date>2020-07-12</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.docker.com/company">https://www.docker.com/company</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Boettiger</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>An introduction to Docker for reproducible research</article-title>
          <source>SIGOPS Oper Syst Rev</source>
          <year>2015</year>
          <month>01</month>
          <day>20</day>
          <volume>49</volume>
          <issue>1</issue>
          <fpage>71</fpage>
          <lpage>79</lpage>
          <pub-id pub-id-type="doi">10.1145/2723872.2723882</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <collab>National Lung Screening Trial Research Team</collab>
            <name name-style="western">
              <surname>Aberle</surname>
              <given-names>DR</given-names>
            </name>
            <name name-style="western">
              <surname>Berg</surname>
              <given-names>CD</given-names>
            </name>
            <name name-style="western">
              <surname>Black</surname>
              <given-names>WC</given-names>
            </name>
            <name name-style="western">
              <surname>Church</surname>
              <given-names>TR</given-names>
            </name>
            <name name-style="western">
              <surname>Fagerstrom</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Galen</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Gareen</surname>
              <given-names>IF</given-names>
            </name>
            <name name-style="western">
              <surname>Gatsonis</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Goldin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Gohagan</surname>
              <given-names>JK</given-names>
            </name>
            <name name-style="western">
              <surname>Hillman</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Jaffe</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Kramer</surname>
              <given-names>BS</given-names>
            </name>
            <name name-style="western">
              <surname>Lynch</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Marcus</surname>
              <given-names>PM</given-names>
            </name>
            <name name-style="western">
              <surname>Schnall</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sullivan</surname>
              <given-names>DC</given-names>
            </name>
            <name name-style="western">
              <surname>Sullivan</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Zylak</surname>
              <given-names>CJ</given-names>
            </name>
          </person-group>
          <article-title>The National Lung Screening Trial: overview and study design</article-title>
          <source>Radiology</source>
          <year>2011</year>
          <month>01</month>
          <volume>258</volume>
          <issue>1</issue>
          <fpage>243</fpage>
          <lpage>253</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21045183"/>
          </comment>
          <pub-id pub-id-type="doi">10.1148/radiol.10091808</pub-id>
          <pub-id pub-id-type="medline">21045183</pub-id>
          <pub-id pub-id-type="pii">radiol.10091808</pub-id>
          <pub-id pub-id-type="pmcid">PMC3009383</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="web">
          <article-title>Data Science Bowl 2017: data description</article-title>
          <source>Kaggle Inc</source>
          <access-date>2020-07-12</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.kaggle.com/c/data-science-bowl-2017/data">https://www.kaggle.com/c/data-science-bowl-2017/data</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="web">
          <source>Open Source Initiative</source>
          <access-date>2020-07-12</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://opensource.org/">https://opensource.org/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="web">
          <article-title>Data Science Bowl 2017: rules</article-title>
          <source>Kaggle Inc</source>
          <access-date>2020-07-12</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.kaggle.com/c/data-science-bowl-2017/rules">https://www.kaggle.com/c/data-science-bowl-2017/rules</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Setio</surname>
              <given-names>AAA</given-names>
            </name>
            <name name-style="western">
              <surname>Traverso</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>de Bel</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Berens</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Bogaard</surname>
              <given-names>CVD</given-names>
            </name>
            <name name-style="western">
              <surname>Cerello</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Dou</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Fantacci</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Geurts</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Gugten</surname>
              <given-names>RVD</given-names>
            </name>
            <name name-style="western">
              <surname>Heng</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Jansen</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>de Kaste</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Kotov</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>JY</given-names>
            </name>
            <name name-style="western">
              <surname>Manders</surname>
              <given-names>JT</given-names>
            </name>
            <name name-style="western">
              <surname>Sóñora-Mengana</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>García-Naranjo</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Papavasileiou</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Prokop</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Saletta</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Schaefer-Prokop</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Scholten</surname>
              <given-names>ET</given-names>
            </name>
            <name name-style="western">
              <surname>Scholten</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Snoeren</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Torres</surname>
              <given-names>EL</given-names>
            </name>
            <name name-style="western">
              <surname>Vandemeulebroucke</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Walasek</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Zuidhof</surname>
              <given-names>GC</given-names>
            </name>
            <name name-style="western">
              <surname>Ginneken</surname>
              <given-names>BV</given-names>
            </name>
            <name name-style="western">
              <surname>Jacobs</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Validation, comparison, and combination of algorithms for automatic detection of pulmonary nodules in computed tomography images: the LUNA16 challenge</article-title>
          <source>Med Image Analysis</source>
          <year>2017</year>
          <month>12</month>
          <volume>42</volume>
          <fpage>1</fpage>
          <lpage>13</lpage>
          <pub-id pub-id-type="doi">10.1016/j.media.2017.06.015</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Armato</surname>
              <given-names>SG</given-names>
            </name>
            <name name-style="western">
              <surname>McLennan</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Bidaut</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>McNitt-Gray</surname>
              <given-names>MF</given-names>
            </name>
            <name name-style="western">
              <surname>Meyer</surname>
              <given-names>CR</given-names>
            </name>
            <name name-style="western">
              <surname>Reeves</surname>
              <given-names>AP</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Aberle</surname>
              <given-names>DR</given-names>
            </name>
            <name name-style="western">
              <surname>Henschke</surname>
              <given-names>CI</given-names>
            </name>
            <name name-style="western">
              <surname>Hoffman</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Kazerooni</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>MacMahon</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Van Beeke</surname>
              <given-names>EJR</given-names>
            </name>
            <name name-style="western">
              <surname>Yankelevitz</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Biancardi</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Bland</surname>
              <given-names>PH</given-names>
            </name>
            <name name-style="western">
              <surname>Brown</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Engelmann</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Laderach</surname>
              <given-names>GE</given-names>
            </name>
            <name name-style="western">
              <surname>Max</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Pais</surname>
              <given-names>RC</given-names>
            </name>
            <name name-style="western">
              <surname>Qing</surname>
              <given-names>DPY</given-names>
            </name>
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>RY</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>Starkey</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Batrah</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Caligiuri</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Farooqi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gladish</surname>
              <given-names>GW</given-names>
            </name>
            <name name-style="western">
              <surname>Jude</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Munden</surname>
              <given-names>RF</given-names>
            </name>
            <name name-style="western">
              <surname>Petkovska</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Quint</surname>
              <given-names>LE</given-names>
            </name>
            <name name-style="western">
              <surname>Schwartz</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Sundaram</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Dodd</surname>
              <given-names>LE</given-names>
            </name>
            <name name-style="western">
              <surname>Fenimore</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Gur</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Petrick</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Freymann</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kirby</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hughes</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Casteele</surname>
              <given-names>AV</given-names>
            </name>
            <name name-style="western">
              <surname>Gupte</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sallamm</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Heath</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Kuhn</surname>
              <given-names>MH</given-names>
            </name>
            <name name-style="western">
              <surname>Dharaiya</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Burns</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Fryd</surname>
              <given-names>DS</given-names>
            </name>
            <name name-style="western">
              <surname>Salganicoff</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Anand</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Shreter</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Vastagh</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Croft</surname>
              <given-names>BY</given-names>
            </name>
          </person-group>
          <article-title>The Lung Image Database Consortium (LIDC) and Image Database Resource Initiative (IDRI): a completed reference database of lung nodules on CT scans</article-title>
          <source>Med Phys</source>
          <year>2011</year>
          <month>02</month>
          <volume>38</volume>
          <issue>2</issue>
          <fpage>915</fpage>
          <lpage>931</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21452728"/>
          </comment>
          <pub-id pub-id-type="doi">10.1118/1.3528204</pub-id>
          <pub-id pub-id-type="medline">21452728</pub-id>
          <pub-id pub-id-type="pmcid">PMC3041807</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Armato</surname>
              <given-names>SG</given-names>
            </name>
            <name name-style="western">
              <surname>Drukker</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Hadjiiski</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Tourassi</surname>
              <given-names>GD</given-names>
            </name>
            <name name-style="western">
              <surname>Engelmann</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Giger</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Redmond</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Farahani</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kirby</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Clarke</surname>
              <given-names>LP</given-names>
            </name>
          </person-group>
          <article-title>LUNGx Challenge for computerized lung nodule classification</article-title>
          <source>J Med Imaging (Bellingham)</source>
          <year>2016</year>
          <month>10</month>
          <volume>3</volume>
          <issue>4</issue>
          <fpage>044506</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/28018939"/>
          </comment>
          <pub-id pub-id-type="doi">10.1117/1.JMI.3.4.044506</pub-id>
          <pub-id pub-id-type="medline">28018939</pub-id>
          <pub-id pub-id-type="pii">16082R</pub-id>
          <pub-id pub-id-type="pmcid">PMC5166709</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ronneberger</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Fischer</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Brox</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Navab</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Hornegger</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wells</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Frangi</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>U-Net: convolutional networks for biomedical image segmentation</article-title>
          <source>Medical Image Computing and Computer-Assisted Intervention—MICCAI 2015. Lecture Notes in Computer Science, vol 9351</source>
          <year>2015</year>
          <publisher-loc>Cham</publisher-loc>
          <publisher-name>Springer</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Simonyan</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Zisserman</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Very deep convolutional networks for large-scale image recognition</article-title>
          <source>arXiv preprint arXiv</source>
          <year>2014</year>
          <fpage>14091556</fpage>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>He</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Ren</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Deep residual learning for image recognition</article-title>
          <year>2016</year>
          <conf-name>IEEE Conference on Computer Vision and Pattern Recognition</conf-name>
          <conf-date>2016</conf-date>
          <conf-loc>Las Vegas</conf-loc>
          <pub-id pub-id-type="doi">10.1109/cvpr.2016.90</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shin</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Roth</surname>
              <given-names>HR</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Nogues</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Yao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Mollura</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Summers</surname>
              <given-names>RM</given-names>
            </name>
          </person-group>
          <article-title>Deep convolutional neural networks for computer-aided detection: CNN architectures, dataset characteristics and transfer learning</article-title>
          <source>IEEE Trans Med Imaging</source>
          <year>2016</year>
          <month>5</month>
          <volume>35</volume>
          <issue>5</issue>
          <fpage>1285</fpage>
          <lpage>1298</lpage>
          <pub-id pub-id-type="doi">10.1109/tmi.2016.2528162</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="web">
          <source>DockerHub</source>
          <access-date>2020-07-12</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://rebrand.ly/chestct">https://rebrand.ly/chestct</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="web">
          <source>Docker images for chest CT analyses</source>
          <access-date>2020-07-12</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/khyu/dsb_chestct">https://github.com/khyu/dsb_chestct</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lifton</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Malcolm</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>McBride</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Cross</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <source>The application of voxel size correction in X-ray computed tomography for dimensional metrology</source>
          <year>2013</year>
          <access-date>2020-07-12</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ndt.net/article/SINCE2013/content/papers/24_Lifton.pdf">https://www.ndt.net/article/SINCE2013/content/papers/24_Lifton.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Berry</surname>
              <given-names>GJ</given-names>
            </name>
            <name name-style="western">
              <surname>Ré</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Altman</surname>
              <given-names>RB</given-names>
            </name>
            <name name-style="western">
              <surname>Snyder</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kohane</surname>
              <given-names>IS</given-names>
            </name>
          </person-group>
          <article-title>Classifying non-small cell lung cancer types and transcriptomic subtypes using convolutional neural networks</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2020</year>
          <month>05</month>
          <day>01</day>
          <volume>27</volume>
          <issue>5</issue>
          <fpage>757</fpage>
          <lpage>769</lpage>
          <pub-id pub-id-type="doi">10.1093/jamia/ocz230</pub-id>
          <pub-id pub-id-type="medline">32364237</pub-id>
          <pub-id pub-id-type="pii">5828209</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Russakovsky</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Deng</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Su</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Krause</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Satheesh</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Karpathy</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Khosla</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bernstein</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Berg</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Fei-Fei</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>ImageNet large scale visual recognition challenge</article-title>
          <source>Int J Comput Vis</source>
          <year>2015</year>
          <month>4</month>
          <day>11</day>
          <volume>115</volume>
          <issue>3</issue>
          <fpage>211</fpage>
          <lpage>252</lpage>
          <pub-id pub-id-type="doi">10.1007/s11263-015-0816-y</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Berry</surname>
              <given-names>GJ</given-names>
            </name>
            <name name-style="western">
              <surname>Rubin</surname>
              <given-names>DL</given-names>
            </name>
            <name name-style="western">
              <surname>Ré</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Altman</surname>
              <given-names>RB</given-names>
            </name>
            <name name-style="western">
              <surname>Snyder</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Association of omics features with histopathology patterns in lung adenocarcinoma</article-title>
          <source>Cell Syst</source>
          <year>2017</year>
          <month>12</month>
          <day>27</day>
          <volume>5</volume>
          <issue>6</issue>
          <fpage>620</fpage>
          <lpage>627</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2405-4712(17)30484-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.cels.2017.10.014</pub-id>
          <pub-id pub-id-type="medline">29153840</pub-id>
          <pub-id pub-id-type="pii">S2405-4712(17)30484-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC5746468</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Berry</surname>
              <given-names>GJ</given-names>
            </name>
            <name name-style="western">
              <surname>Altman</surname>
              <given-names>RB</given-names>
            </name>
            <name name-style="western">
              <surname>Ré</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Rubin</surname>
              <given-names>DL</given-names>
            </name>
            <name name-style="western">
              <surname>Snyder</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Predicting non-small cell lung cancer prognosis by fully automated microscopic pathology image features</article-title>
          <source>Nat Commun</source>
          <year>2016</year>
          <month>12</month>
          <day>16</day>
          <volume>7</volume>
          <fpage>12474</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.nature.com/articles/ncomms12474#supplementary-information"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/ncomms12474</pub-id>
          <pub-id pub-id-type="medline">27527408</pub-id>
          <pub-id pub-id-type="pii">ncomms12474</pub-id>
          <pub-id pub-id-type="pmcid">PMC4990706</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Fitzpatrick</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Pappas</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Chan</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Kung</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Snyder</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Omics AnalySIs System for PRecision Oncology (OASISPRO): a web-based omics analysis tool for clinical phenotype prediction</article-title>
          <source>Bioinformatics</source>
          <year>2018</year>
          <month>01</month>
          <day>15</day>
          <volume>34</volume>
          <issue>2</issue>
          <fpage>319</fpage>
          <lpage>320</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/28968749"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/btx572</pub-id>
          <pub-id pub-id-type="medline">28968749</pub-id>
          <pub-id pub-id-type="pii">4124859</pub-id>
          <pub-id pub-id-type="pmcid">PMC5860203</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nishio</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sugiyama</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Yakami</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ueno</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kubo</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Kuroda</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Togashi</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Computer-aided diagnosis of lung nodule classification between benign nodule, primary lung cancer, and metastatic lung cancer at different image size using deep convolutional neural network with transfer learning</article-title>
          <source>PLoS One</source>
          <year>2018</year>
          <volume>13</volume>
          <issue>7</issue>
          <fpage>e0200721</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0200721"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0200721</pub-id>
          <pub-id pub-id-type="medline">30052644</pub-id>
          <pub-id pub-id-type="pii">PONE-D-18-07539</pub-id>
          <pub-id pub-id-type="pmcid">PMC6063408</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>da Silva</surname>
              <given-names>GLF</given-names>
            </name>
            <name name-style="western">
              <surname>Valente</surname>
              <given-names>TLA</given-names>
            </name>
            <name name-style="western">
              <surname>Silva</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>de Paiva</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Gattass</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Convolutional neural network-based PSO for lung nodule false positive reduction on CT images</article-title>
          <source>Comput Methods Programs Biomed</source>
          <year>2018</year>
          <month>08</month>
          <volume>162</volume>
          <fpage>109</fpage>
          <lpage>118</lpage>
          <pub-id pub-id-type="doi">10.1016/j.cmpb.2018.05.006</pub-id>
          <pub-id pub-id-type="medline">29903476</pub-id>
          <pub-id pub-id-type="pii">S0169-2607(17)30438-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ait Skourt</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>El Hassani</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Majda</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Lung CT image segmentation using deep neural networks</article-title>
          <source>Procedia Comput Sci</source>
          <year>2018</year>
          <volume>127</volume>
          <fpage>109</fpage>
          <lpage>113</lpage>
          <pub-id pub-id-type="doi">10.1016/j.procs.2018.01.104</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lakshmanaprabu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Mohanty</surname>
              <given-names>SN</given-names>
            </name>
            <name name-style="western">
              <surname>Shankar</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Arunkumar</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Ramirez</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Optimal deep learning model for classification of lung cancer on CT images</article-title>
          <source>Future Gen Comput Syst</source>
          <year>2019</year>
          <month>03</month>
          <volume>92</volume>
          <fpage>374</fpage>
          <lpage>382</lpage>
          <pub-id pub-id-type="doi">10.1016/j.future.2018.10.009</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Automated pulmonary nodule detection in CT images using deep convolutional neural networks</article-title>
          <source>Pattern Recognition</source>
          <year>2019</year>
          <month>01</month>
          <volume>85</volume>
          <fpage>109</fpage>
          <lpage>119</lpage>
          <pub-id pub-id-type="doi">10.1016/j.patcog.2018.07.031</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Trott</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <source>The Perfect Score script</source>
          <year>2017</year>
          <access-date>2020-05-24</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.kaggle.com/olegtrott/the-perfect-score-script">https://www.kaggle.com/olegtrott/the-perfect-score-script</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kohane</surname>
              <given-names>IS</given-names>
            </name>
          </person-group>
          <article-title>Framing the challenges of artificial intelligence in medicine</article-title>
          <source>BMJ Qual Saf</source>
          <year>2019</year>
          <month>03</month>
          <volume>28</volume>
          <issue>3</issue>
          <fpage>238</fpage>
          <lpage>241</lpage>
          <pub-id pub-id-type="doi">10.1136/bmjqs-2018-008551</pub-id>
          <pub-id pub-id-type="medline">30291179</pub-id>
          <pub-id pub-id-type="pii">bmjqs-2018-008551</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Brain</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Webb</surname>
              <given-names>GI</given-names>
            </name>
          </person-group>
          <source>On the effect of data set size on bias and variance in classification learning</source>
          <year>1999</year>
          <access-date>2020-07-12</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://pdfs.semanticscholar.org/6daf/14076a7ad2c4b4f1a8eb28778b9c641777e7.pdf">https://pdfs.semanticscholar.org/6daf/14076a7ad2c4b4f1a8eb28778b9c641777e7.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
