<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v22i3e17695</article-id>
      <article-id pub-id-type="pmid">32181751</article-id>
      <article-id pub-id-type="doi">10.2196/17695</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Identifying Lung Cancer Risk Factors in the Elderly Using Deep Neural Networks: Quantitative Analysis of Web-Based Survey Data</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Brown</surname>
            <given-names>Anderson</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Clinton</surname>
            <given-names>William</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>Songjing</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Institute of Medical Information and Library</institution>
            <institution>Chinese Academy of Medical Sciences / Peking Union Medical College</institution>
            <addr-line>No 3, Yabao Road, Chaoyang District</addr-line>
            <addr-line>Beijing</addr-line>
            <country>China</country>
            <phone>86 01052328761</phone>
            <email>chen.songjing@imicams.ac.cn</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6409-8938</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Wu</surname>
            <given-names>Sizhu</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6758-6259</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Institute of Medical Information and Library</institution>
        <institution>Chinese Academy of Medical Sciences / Peking Union Medical College</institution>
        <addr-line>Beijing</addr-line>
        <country>China</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Songjing Chen <email>chen.songjing@imicams.ac.cn</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>3</month>
        <year>2020</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>17</day>
        <month>3</month>
        <year>2020</year>
      </pub-date>
      <volume>22</volume>
      <issue>3</issue>
      <elocation-id>e17695</elocation-id>
      <history>
        <date date-type="received">
          <day>4</day>
          <month>1</month>
          <year>2020</year>
        </date>
        <date date-type="rev-request">
          <day>18</day>
          <month>1</month>
          <year>2020</year>
        </date>
        <date date-type="rev-recd">
          <day>19</day>
          <month>1</month>
          <year>2020</year>
        </date>
        <date date-type="accepted">
          <day>22</day>
          <month>1</month>
          <year>2020</year>
        </date>
      </history>
      <copyright-statement>©Songjing Chen, Sizhu Wu. Originally published in the Journal of Medical Internet Research (http://www.jmir.org), 17.03.2020.</copyright-statement>
      <copyright-year>2020</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on http://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="http://www.jmir.org/2020/3/e17695/" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Lung cancer is one of the most dangerous malignant tumors, with the fastest-growing morbidity and mortality, especially in the elderly. With a rapid growth of the elderly population in recent years, lung cancer prevention and control are increasingly of fundamental importance, but are complicated by the fact that the pathogenesis of lung cancer is a complex process involving a variety of risk factors.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aimed at identifying key risk factors of lung cancer incidence in the elderly and quantitatively analyzing these risk factors’ degree of influence using a deep learning method.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>Based on Web-based survey data, we integrated multidisciplinary risk factors, including behavioral risk factors, disease history factors, environmental factors, and demographic factors, and then preprocessed these integrated data. We trained deep neural network models in a stratified elderly population. We then extracted risk factors of lung cancer in the elderly and conducted quantitative analyses of the degree of influence using the deep neural network models.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>The proposed model quantitatively identified risk factors based on 235,673 adults. The proposed deep neural network models of 4 groups (age ≥65 years, women ≥65 years, men ≥65 years, and the whole population) achieved good performance in identifying lung cancer risk factors, with accuracy ranging from 0.927 (95% CI 0.223-0.525; <italic>P</italic>=.002) to 0.962 (95% CI 0.530-0.751; <italic>P</italic>=.002) and the area under the curve ranging from 0.913 (95% CI 0.564-0.803) to 0.931 (95% CI 0.499-0.593). Smoking frequency was the leading risk factor for lung cancer in men 65 years and older. Time since quitting and smoking at least 100 cigarettes in their lifetime were the main risk factors for lung cancer in women 65 years and older. Men 65 years and older had the highest lung cancer incidence among the stratified groups, particularly non–small cell lung cancer incidence. Lung cancer incidence decreased more obviously in men than in women with smoking rate decline.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>This study demonstrated a quantitative method to identify risk factors of lung cancer in the elderly. The proposed models provided intervention indicators to prevent lung cancer, especially in older men. This approach might be used as a risk factor identification tool to apply in other cancers and help physicians make decisions on cancer prevention.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>deep learning</kwd>
        <kwd>lung cancer</kwd>
        <kwd>risk factors</kwd>
        <kwd>aged</kwd>
        <kwd>primary prevention</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>Lung cancer is one of the most dangerous malignant tumors, with the fastest-growing morbidity and mortality, especially in the elderly. With the rapid growth of the elderly population in recent years, lung cancer prevention and control are becoming much more important than ever before. Non–small cell lung cancer (NSCLC) is the most common type of lung cancer [<xref ref-type="bibr" rid="ref1">1</xref>].</p>
        <p>Lung cancer pathogenesis is a complex process involving various risk factors. Factors such as smoking [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref3">3</xref>], secondhand smoke [<xref ref-type="bibr" rid="ref4">4</xref>], high levels of air pollution exposure [<xref ref-type="bibr" rid="ref5">5</xref>], and drinking water that has a high level of arsenic [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>] can increase the risk of occurrence of lung cancer. The relationship between these risk factors and lung cancer incidence is an urgent research problem.</p>
        <p>In high-income countries, a combination of early diagnosis, screening, and treatment has been effective in increasing population-based survival for certain cancers [<xref ref-type="bibr" rid="ref8">8</xref>-<xref ref-type="bibr" rid="ref10">10</xref>]. Many lung cancer screening-related studies have been conducted recently. In the United States, the National Lung Screening Trial was conducted to investigate the possibility that low-dose computed tomography (CT) could reduce lung cancer mortality [<xref ref-type="bibr" rid="ref11">11</xref>]. Zahnd and Eberth found that use of CT screening was higher than in earlier estimates using 2017 Behavioral Risk Factor Surveillance System (BRFSS) survey data [<xref ref-type="bibr" rid="ref12">12</xref>]. The US Preventive Services Task Force recommended annual screening of individuals at high risk of lung cancer aged 55 to 80 years who have a 30–pack-year smoking history and currently smoke or had quit within the past 15 years [<xref ref-type="bibr" rid="ref13">13</xref>]. Berkowitz and colleagues used 2012 BRFSS data to develop multilevel small-area estimate mixed models to generate county-level estimates for 6 smoking status categories (current, some days, every day, former, ever, and never) [<xref ref-type="bibr" rid="ref14">14</xref>].</p>
        <p>Machine learning algorithms are being used more widely for lung cancer screening, detection, diagnosis, and other related research. Luna and colleagues used random forest as an accurate machine learning method to identify known and new predictors of symptomatic radiation pneumonitis, which is a radiotherapy dose-limiting toxicity for locally advanced NSCLC [<xref ref-type="bibr" rid="ref15">15</xref>]. Palani and Venkatalakshmi used a fuzzy clustering method to predict lung cancer through continuous monitoring using a new internet of things–based approach and to improve health care by providing medical instructions [<xref ref-type="bibr" rid="ref16">16</xref>]. A K-means clustering algorithm, based initially on 400 cancer and non–cancer patients’ data, was developed to identify relevant and nonrelevant lung cancer data for early detection of lung cancer [<xref ref-type="bibr" rid="ref17">17</xref>]. Liu and colleagues used multivariable logistic regression to assess the relationship between body mass index and respiratory conditions, asthma, and chronic obstructive pulmonary disease (COPD) based on BRFSS data [<xref ref-type="bibr" rid="ref18">18</xref>]. A series of machine learning methods were applied to classify lung cancer patients’ survival, including linear regression, decision trees, gradient boosting machines, support vector machines, and a custom ensemble [<xref ref-type="bibr" rid="ref19">19</xref>]. Deep learning methods were previously rarely used to identify lung cancer risk factors, but their use has become more common recently. Cha and colleagues studied a deep convolutional neural network model to detect operable lung cancer with chest radiographs [<xref ref-type="bibr" rid="ref20">20</xref>]. Deep learning algorithms might aid fully automated lung cancer detection even at very low effective radiation doses of 0.11 mSv [<xref ref-type="bibr" rid="ref21">21</xref>]. Hosny and colleagues provided evidence that a convolutional neural network might be used for mortality risk stratification based on standard-of-care CT images from NSCLC patients [<xref ref-type="bibr" rid="ref22">22</xref>].</p>
      </sec>
      <sec>
        <title>Objective</title>
        <p>This study aimed at identifying key risk factors of lung cancer incidence in a stratified elderly population and quantitatively analyzing the risk factors’ degree of influence using a deep neural network (DNN) method. Using Web-based survey data, we focused on multidisciplinary risk factors, such as smoking habit, disease history, radiation exposure, behavioral risk, environmental risk, and medical demographics. Our main research problems were how to find the leading causative factors of lung cancer incidence from complex related risk factors and to quantitatively analyze their degree of influence. Our results could help physicians in preventing lung cancer and taking effective measures for early detection.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Data Source</title>
        <p>We obtained lung cancer risk factors from the BRFSS [<xref ref-type="bibr" rid="ref23">23</xref>], an open access source from the US Centers for Disease Control and Prevention. BRFSS collects survey data from US residents about their health-related risk behaviors, chronic health conditions, use of preventive services, and so on. In this study, we used lung cancer behavioral health risk data of 235,673 adults from all 50 US states between 1996 and 2017. The flowchart in <xref rid="figure1" ref-type="fig">Figure 1</xref> shows the data selection process.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Data selection flowchart. BRFSS: Behavioral Risk Factor Surveillance System.</p>
          </caption>
          <graphic xlink:href="jmir_v22i3e17695_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>Lung cancer has many causative factors, including age 65 years and older, body mass index, education, smoking habit, personal history of cancer, family history of cancer, CT or computerized axial tomography (CAT) scan, asthma history, and COPD history. <xref ref-type="table" rid="table1">Table 1</xref> lists some relevant survey questions from the BRFSS questionnaire that we used to collect data for this study.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Lung cancer risk factors assessed by the Behavioral Risk Factor Surveillance System questionnaire.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="350"/>
            <col width="650"/>
            <thead>
              <tr valign="top">
                <td>Risk factors</td>
                <td>Description</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Age</td>
                <td>Age ≥65 years? (yes/no)</td>
              </tr>
              <tr valign="top">
                <td>Body mass index</td>
                <td>Level 1: &lt;18.5 kg/m<sup>2</sup>; 2: 18.5-24.9 kg/m<sup>2</sup>; 3: 25.0-29.9 kg/m<sup>2</sup>; 4: ≥30.0 kg/m<sup>2</sup></td>
              </tr>
              <tr valign="top">
                <td>Education</td>
                <td>Level of education completed (level 1: Did not graduate from high school; 2: Graduated from high school; 3: Attended postsecondary or technical school; 4: Graduated from postsecondary or technical school)</td>
              </tr>
              <tr valign="top">
                <td>Smoked at least 100 cigarettes</td>
                <td>Smoked at least 100 cigarettes in your entire life (yes/no; 1 pack contains 20 cigarettes)</td>
              </tr>
              <tr valign="top">
                <td>Smoking frequency</td>
                <td>Level 1: Every day; 2: Some days; 3: Not at all</td>
              </tr>
              <tr valign="top">
                <td>Smoking start age</td>
                <td>How old were you when you first started to smoke cigarettes regularly? (Age in years)</td>
              </tr>
              <tr valign="top">
                <td>Smoking intensity</td>
                <td>How many cigarettes do you smoke each day? (Number of cigarettes/day)</td>
              </tr>
              <tr valign="top">
                <td>Smoking quit attempts</td>
                <td>During the past 12 months, have you stopped smoking for 1 day or longer? (yes/no)</td>
              </tr>
              <tr valign="top">
                <td>Time since quitting</td>
                <td>How long has it been since you last smoked a cigarette? (1: Within the past month; 2: Within the past 3 months; 3: Within the past 6 months; 4: Within the past year; 5: Within the past 5 years; 6: Within the past 10 years; 7: 10 years or more; 8: Never smoked regularly)</td>
              </tr>
              <tr valign="top">
                <td>E-cigarette use</td>
                <td>Have you ever used an e-cigarette or other electronic vaping product, even just one time? (yes/no)</td>
              </tr>
              <tr valign="top">
                <td>E-cigarette use frequency</td>
                <td>Do you now use e-cigarettes or other electronic vaping products every day, some days, or not at all? (1: Every day; 2: Some days; 3: Not at all)</td>
              </tr>
              <tr valign="top">
                <td>Chronic obstructive pulmonary disease (COPD) history</td>
                <td>History of COPD (yes/no)</td>
              </tr>
              <tr valign="top">
                <td>Asthma history</td>
                <td>History of asthma (yes/no)</td>
              </tr>
              <tr valign="top">
                <td>Cancer history</td>
                <td>Personal history of cancer (yes/no)</td>
              </tr>
              <tr valign="top">
                <td>Family history of cancer</td>
                <td>Family history of cancer (yes/no)</td>
              </tr>
              <tr valign="top">
                <td>Computed tomography (CT) or computerized axial tomography (CAT) scan</td>
                <td>In the last 12 months, did you have a CT or CAT scan? (yes/no)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <p>Participants who were 65 years and older accounted for about 35.01% (82,503/235,673) of the survey population and those aged 18 to 64 years accounted for 64.99% (153,170/235,673). By sex, 53.99% (127,262/235,673) were women and 46.01% (108,411/235,673) were men.</p>
        <p>We derived environmental risk factors from the open access website of the US Environmental Protection Agency [<xref ref-type="bibr" rid="ref24">24</xref>], including air pollutants and drinking water. According to the investigation date, we linked environmental data with risk factors from the BRFSS.</p>
      </sec>
      <sec>
        <title>Data Analysis</title>
        <sec>
          <title>Overview</title>
          <p>In this study, we employed a DNN model to identify risk factors for lung cancer in the elderly. The DNN model had a multiple-layer structure and powerful data expression ability. In particular, in training models based on the large dataset, DNN had high calculation accuracy. First, we integrated the data on medical demographics, smoking habit, disease history, radiation exposure, behavioral risk, and other aspects. Second, since the number of cases of lung cancer was much lower than that of non–lung cancers, we balanced the data. Then we preprocessed these balanced data. Third, we trained DNN models by leveraging the stratified data of the elderly population. We extracted the stratified risk factors through DNN models. Fourth, we developed a quantitative analysis of the degree of effect of the risk factors in elderly patients. Therefore, the whole study comprised 4 sections: data integration, data balancing and preprocessing, training of DNN models, and quantitative analysis of risk factors, as <xref rid="figure2" ref-type="fig">Figure 2</xref> shows.</p>
          <fig id="figure2" position="float">
            <label>Figure 2</label>
            <caption>
              <p>Schematic diagram of lung cancer risk factor identification in the elderly. DNN: deep neural network.</p>
            </caption>
            <graphic xlink:href="jmir_v22i3e17695_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Data Integration</title>
          <p>Lung cancer incidence is caused by multiple risk factors [<xref ref-type="bibr" rid="ref25">25</xref>-<xref ref-type="bibr" rid="ref27">27</xref>], particularly in the elderly [<xref ref-type="bibr" rid="ref28">28</xref>]. We integrated these risk factors, including medical demographics, smoking, disease history, radiation exposure, behavioral risk, and environmental risk. Medical demographic factors were age, sex, body mass index, and education level. Smoking factors were smoking intensity, age when starting to smoke, smoking frequency, time since quitting, e-cigarette use, secondhand smoke exposure, and other smoking habits. Disease history referred to COPD history, asthma history, personal cancer history, and family history of cancer. Radiation exposure involved radiotherapy of the breast or chest, CT or CAT medical imaging examination, and occupational exposure to asbestos, radon, and arsenic. We also took into account dietary and exercise habits and other behavioral risk factors.</p>
        </sec>
        <sec>
          <title>Data Balancing and Preprocessing</title>
          <p>The ratio of lung cancer to non–lung cancer cases was about 1:115. When studying the pathogenesis of lung cancer, this situation could cause a data imbalance problem. Therefore, we used the synthetic minority oversampling technique (SMOTE) [<xref ref-type="bibr" rid="ref29">29</xref>] to solve the imbalance problem. SMOTE uses the K-nearest neighbor algorithm to generate synthetic samples of the minority class. We then added these simulated samples to the whole dataset.</p>
          <p>At the same time, the integrated data had missing values, incomplete records, and other quality problems. We therefore preprocessed the data using techniques such as missing-value imputation and noise smoothing. We used multiple imputation [<xref ref-type="bibr" rid="ref30">30</xref>] to fill in missing values. We conducted singular value decomposition [<xref ref-type="bibr" rid="ref31">31</xref>] to reduce data noise in the data preprocessing stage.</p>
          <p>We divided the preprocessed data into 4 groups: those aged 65 years and older (age ≥65 years), women aged 65 years and older (women ≥65 years), men aged 65 years and older (men ≥65 years), and the whole population.</p>
        </sec>
        <sec>
          <title>Deep Neural Network Model Training</title>
          <p>By leveraging the weights of the DNN models, we quantified the degree of influence of risk factors on lung cancer incidence in the elderly (<xref rid="figure3" ref-type="fig">Figure 3</xref>). First, we converted the data format into hierarchical data format version 5 (HDF5) [<xref ref-type="bibr" rid="ref32">32</xref>] in the 4 stratified groups (age ≥65 years, women ≥65 years, men ≥65 years, and the whole group) separately. HDF5 is recognized by Convolutional Architecture for Fast Feature Embedding (Caffe) [<xref ref-type="bibr" rid="ref33">33</xref>], an open source general deep learning framework. Second, we used the Caffe framework to train DNN models based on the stratified groups in sequence. We input integrated data through an input layer, and then computed the weight values of different risk factors in a hidden layer. We obtained key risk factors using weight values through the output layer of the DNN model. Third, we extracted different risk factors of the stratified groups according to their DNN models.</p>
          <fig id="figure3" position="float">
            <label>Figure 3</label>
            <caption>
              <p>Deep learning model training process. DNN: deep neural network; HDF5: hierarchical data format version 5.</p>
            </caption>
            <graphic xlink:href="jmir_v22i3e17695_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
          <p>The DNN model of the group aged 65 years and older consisted of 3 types of layers: the input layer, hidden layers, and output layer. Specifically, this model included 1 input layer, 3 hidden layers, and 1 output layer. Adjacent layers were fully connected; in other words, every neuron in the <italic>i</italic>th layer was connected to every neuron in the <italic>(i+1)</italic>th layer. Therefore, there was a linear relationship where <italic>z</italic> = ∑<italic>w<sub>i</sub>x<sub>i</sub></italic> + <italic>b</italic>, plus an activation function, σ(<italic>z</italic>). We used a rectified linear unit function, given in Equation 1 (<xref rid="figure4" ref-type="fig">Figure 4</xref>), as an activation function to improve model expression ability. We used 10-fold cross-validation to test algorithm accuracy. We divided the data of the group aged 65 years and older into 10 parts. We rotated them to use 9 of them as a training dataset and 1 as a test dataset for DNN model training.</p>
          <fig id="figure4" position="float">
            <label>Figure 4</label>
            <caption>
              <p>Data analysis equations.</p>
            </caption>
            <graphic xlink:href="jmir_v22i3e17695_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
          <p>The output results α<italic><sup>L</sup></italic> of the DNN model can be deduced from Equation 2 (<xref rid="figure4" ref-type="fig">Figure 4</xref>), where W is the weight matrix between the hidden layer and the output layer, which represents the influence of risk factors on lung cancer incidence; L is the number of layers and variable <italic>l</italic> is 2 to L; and b is the bias vector. The numbers of input nodes and output nodes relied on the number of input and output factors, and the hidden-layer number was determined by data size. We set a value of 30 for the input nodes, 3 for the hidden layers, and 9 for the output nodes. In this way, we constructed the DNN model of the group aged 65 years and older. We used the same network structure to train the DNN models of the other 3 stratified groups separately.</p>
        </sec>
        <sec>
          <title>Risk Factor Quantitative Analysis</title>
          <p>We normalized the weight (<italic>w</italic>) using Equation 3 (<xref rid="figure4" ref-type="fig">Figure 4</xref>) to extract key risk factors of lung cancer occurrence. The value of normalized weight (<italic>w</italic><sub>Normalized</sub>) was between 0 and 1. <italic>w</italic><sub>Min</sub> is the minimum value of weight, and <italic>w</italic><sub>Max</sub> is the maximum value of weight. We developed a quantitative analysis of different risk factors in the 4 groups. Because weights represented the degree of influence of risk factors on lung cancer occurrence, we compared the weights of risk factors to identify targeted factors among the 4 stratified groups.</p>
        </sec>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Risk Factor Weights</title>
        <p><xref rid="figure5" ref-type="fig">Figure 5</xref> shows the weights of risk factors in the 4 stratified groups obtained using DNN models. Through leveraging weights of DNN models, we quantitatively analyzed the degree of the risk factors’ influence on lung cancer incidence in the elderly. <xref ref-type="table" rid="table2">Table 2</xref> shows the values of weights and odds ratios (95% CI) of these main risk factors.</p>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>Normalized weights of risk factors in the stratified groups. BMI: body mass index; CAT: computerized axial tomography; COPD: chronic obstructive pulmonary disease; CT: computed tomography; PM2.5: fine particulate matter with a diameter ≤2.5 μm.</p>
          </caption>
          <graphic xlink:href="jmir_v22i3e17695_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Normalized weight values and odds ratios (95% CI) of the main risk factors in the 4 population groups.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="160"/>
            <col width="60"/>
            <col width="150"/>
            <col width="60"/>
            <col width="150"/>
            <col width="0"/>
            <col width="60"/>
            <col width="150"/>
            <col width="0"/>
            <col width="60"/>
            <col width="150"/>
            <thead>
              <tr valign="top">
                <td rowspan="2">Risk factors</td>
                <td colspan="2">Population aged ≥65 years</td>
                <td colspan="3">Men aged ≥65 years</td>
                <td colspan="3">Women aged ≥65 years</td>
                <td colspan="2">All age groups</td>
              </tr>
              <tr valign="top">
                <td>Weight</td>
                <td>Odds ratio (95% CI)</td>
                <td>Weight</td>
                <td>Odds ratio (95% CI)</td>
                <td colspan="2">Weight</td>
                <td>Odds ratio (95% CI)</td>
                <td colspan="2">Weight</td>
                <td>Odds ratio (95% CI)</td>
              </tr>
              <tr valign="top">
                <td colspan="11">
                  <break/>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Time since quitting</td>
                <td>0.21</td>
                <td>1.422 (0.806-1.095)</td>
                <td>0.13</td>
                <td>1.587 (0.776-0.998)</td>
                <td colspan="2">0.20</td>
                <td>1.590 (0.927-1.358)</td>
                <td colspan="2">0.009</td>
                <td>1.109 (0.993-1.322)</td>
              </tr>
              <tr valign="top">
                <td>Smoking frequency</td>
                <td>0.11</td>
                <td>1.312 (0.796-0.998)</td>
                <td>0.18</td>
                <td>1.625 (0.866-1.097)</td>
                <td colspan="2">0.16</td>
                <td>1.536 (1.106-1.427)</td>
                <td colspan="2">0.14</td>
                <td>1.370 (1.352-1.701)</td>
              </tr>
              <tr valign="top">
                <td>Cancer history</td>
                <td>0.099</td>
                <td>1.295 (0.876-1.027)</td>
                <td>0.09</td>
                <td>1.387 (1.239-1.667)</td>
                <td colspan="2">0.11</td>
                <td>1.442 (0.951-1.356)</td>
                <td colspan="2">0.09</td>
                <td>1.271 (0.852-1.201)</td>
              </tr>
              <tr valign="top">
                <td>Smoking quit attempts</td>
                <td>0.091</td>
                <td>1.253 (0.933-1.201)</td>
                <td>0.06</td>
                <td>1.273 (1.413-1.702)</td>
                <td colspan="2">0.07</td>
                <td>1.368 (1.127-1.406)</td>
                <td colspan="2">0.20</td>
                <td>1.405 (0.995-1.381)</td>
              </tr>
              <tr valign="top">
                <td>Lifetime smoking of ≥100 cigarettes</td>
                <td>0.081</td>
                <td>1.239 (1.336-1.587)</td>
                <td>0.11</td>
                <td>1.506 (0.681-0.937)</td>
                <td colspan="2">0.18</td>
                <td>1.588 (1.237-1.601)</td>
                <td colspan="2">0.16</td>
                <td>1.387 (1.225-1.611)</td>
              </tr>
              <tr valign="top">
                <td>Asthma history</td>
                <td>0.08</td>
                <td>1.303 (1.029-1.403)</td>
                <td>0.005</td>
                <td>1.095 (0.962-1.329)</td>
                <td colspan="2">0.07</td>
                <td>1.381 (0.953-1.317)</td>
                <td colspan="2">0.007</td>
                <td>1.112 (0.961-1.406)</td>
              </tr>
              <tr valign="top">
                <td>Radiation</td>
                <td>0.08</td>
                <td>1.224 (1.550-1.781)</td>
                <td>0.09</td>
                <td>1.291 (0.983-1.307)</td>
                <td colspan="2">0.12</td>
                <td>1.453 (1.302-1.759)</td>
                <td colspan="2">0.03</td>
                <td>1.190 (0.952-1.357)</td>
              </tr>
              <tr valign="top">
                <td>E-cigarette use</td>
                <td>0.023</td>
                <td>1.025 (0.766-0.934)</td>
                <td>0.12</td>
                <td>1.539 (1.112-1.406)</td>
                <td colspan="2">0.005</td>
                <td>1.135 (0.897-1.309)</td>
                <td colspan="2">0.074</td>
                <td>1.239 (0.851-1.307)</td>
              </tr>
              <tr valign="top">
                <td>Physical activity</td>
                <td>0.023</td>
                <td>1.132 (0.983-1.246)</td>
                <td>0.01</td>
                <td>1.170 (0.851-1.209)</td>
                <td colspan="2">0.03</td>
                <td>1.280 (0.991-1.308)</td>
                <td colspan="2">0.08</td>
                <td>1.268 (1.131-1.670)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Effect of Risk Factors on Lung Cancer</title>
        <p>Those aged 65 years and older were more sensitive to how long ago former smokers had quit and smoking frequency, which were related to smoking. This correlation was more obvious in men aged 65 years and older. Those aged 65 years and older who had quit smoking for a short time or smoked more every day were prone to lung cancer.</p>
        <p>Smoking frequency was the leading risk factor for lung cancer in men aged 65 years and older. As <xref ref-type="table" rid="table2">Table 2</xref> shows, the weights of smoking frequency and time since quitting were 0.18 and 0.13, respectively, in this group of men. The weight of smoking frequency was 38.5% higher than the weight of time since quitting. The top 4 risk factors of men aged 65 years and older (smoking frequency, time since quitting, use of e-cigarettes, and having smoked at least 100 cigarettes in their lifetime) were all associated with smoking. These smoking-related risk factors had a greater influence than other risk factors on men who were 65 years and older. Men in this age group who actively quit smoking were more likely to avoid lung cancer.</p>
        <p>Time since quitting and smoking at least 100 cigarettes over their lifetime were the main risk factors for lung cancer occurrence in women aged 65 years and older. As <xref ref-type="table" rid="table2">Table 2</xref> shows, the weight of time since quitting was 0.20 in this group of women, which was 11.1% greater than the weight of having smoked at least 100 cigarettes (0.18). The top 3 relevant risk factors were associated with smoking habit factors in women aged 65 years and older: time since quitting, having smoked at least 100 cigarettes, and smoking frequency. Therefore, smoking-related risk factors had a greater influence than other risk factors on women in this age group.</p>
        <p>Cancer history ranked in the top risk factors in the 4 stratified groups, which may suggest that cancer history played an important role in the incidence of lung cancer [<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref35">35</xref>]. Women aged 65 years and older were more sensitive to radiation exposure than were other groups. Physical activity was the fifth risk factor in the whole group.</p>
      </sec>
      <sec>
        <title>Association Between Smoking and Lung Cancer Incidence</title>
        <p>Men aged 65 years and older had the highest lung cancer incidence in these stratified groups, especially the incidence of NSCLC. We compared the incidence rate of lung cancer, NSCLC, and small cell lung cancer among all ages, under 65 years, and 65 years and older. NSCLC incidence in men 65 years and older was 286 cases per 100,000 people between 2011 and 2015, which was higher than that of women aged 65 years and older (203 per 100,000). Therefore, controlling smoking in men aged 65 years and older could be more effective in preventing lung cancer.</p>
        <p>Lung cancer incidence decreased much more rapidly in men than in women with a decline in smoking rate, as <xref rid="figure6" ref-type="fig">Figure 6</xref> shows. The smoking rate curve shows that the proportion of smokers decreased between 1996 and 2015, from 23% to 14% (a relative decrease of about 39.1%). Smoking rate has declined continuously in recent years. <xref rid="figure6" ref-type="fig">Figure 6</xref> also shows that the incidence of lung cancer in men declined from 88 per 100,000 in 1996 to 58 per 100,000 in 2015, a relative reduction of 34.1%. Thus, lung cancer incidence in men decreased as the smoking rate declined.</p>
        <fig id="figure6" position="float">
          <label>Figure 6</label>
          <caption>
            <p>Relationship between smoking and lung cancer incidence, 1996-2015.</p>
          </caption>
          <graphic xlink:href="jmir_v22i3e17695_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Accuracy of Deep Neural Network Models</title>
        <p><xref ref-type="table" rid="table3">Table 3</xref> summarizes the performance of the 4 DNN models. The proposed models had good accuracy and area under the receiver operating characteristic curve (AUROC), using the whole group as a baseline to reveal lung cancer incidence in elderly patients. Accuracies were 96.2% (95% CI 0.530-0.751, <italic>P</italic>=.002) for age 65 years and older, 94.3% (95% CI 0.459-0.643, <italic>P</italic>=.015) for men 65 years and older, and 93.2% (95% CI 0.437-0.689, <italic>P</italic>=.003) for women 65 years and older, which were higher than the whole group accuracy of 92.7% (95% CI 0.223-0.525, <italic>P</italic>=.002). Moreover, AUROCs were 0.931 (95% CI 0.499-0.593) for age 65 years and older, 0.927 (95% CI 0.506-0.681) for men 65 years and older, and 0.926 (95% CI 0.543-0.782) for women 65 years and older, performing better than the whole group at 0.913 (95% CI 0.564-0.803). The proposed model output the identified risk factors efficiently, which saved time.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Performance of the 4 DNN models.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="250"/>
            <col width="250"/>
            <col width="250"/>
            <col width="250"/>
            <thead>
              <tr valign="bottom">
                <td>Model</td>
                <td>Accuracy (95% CI)</td>
                <td>AUROC<sup>a</sup> (95% CI)</td>
                <td><italic>P</italic> value<sup>b</sup></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>≥65 years</td>
                <td>0.962 (0.530-0.751)</td>
                <td>0.931 (0.499-0.593)</td>
                <td>.002</td>
              </tr>
              <tr valign="top">
                <td>Men ≥65 years</td>
                <td>0.943 (0.459-0.643)</td>
                <td>0.927 (0.506-0.681)</td>
                <td>.015</td>
              </tr>
              <tr valign="top">
                <td>Women ≥65 years</td>
                <td>0.932 (0.437-0.689)</td>
                <td>0.926 (0.543-0.782)</td>
                <td>.003</td>
              </tr>
              <tr valign="top">
                <td>All</td>
                <td>0.927 (0.223-0.525)</td>
                <td>0.913 (0.564-0.803)</td>
                <td>.002</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>AUROC: area under the receiver operating characteristic curve.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup><italic>P</italic>&#60;.05 was considered to indicate statistical significance.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>We developed, to our knowledge, the first deep learning classification model to quantitatively identify corresponding risk factors for lung cancer for stratified groups of elderly people. By leveraging the weights of the DNN models, we identified risk factors for lung cancer in the elderly and quantitatively analyzed the risk factors’ degree of influence. The proposed DNN models of 4 groups (age ≥65 years, women ≥65 years, men ≥65 years, and the whole population) achieved good performance in identifying lung cancer risk factors, with accuracy ranging from 0.927 (95% CI 0.223-0.525, <italic>P</italic>=.002) to 0.962 (95% CI 0.530-0.751, <italic>P</italic>=.002) and AUROCs ranging from 0.913 (95% CI 0.564-0.803) to 0.931 (95% CI 0.499-0.593). The proposed models had a fast training speed and high accuracy and efficiency compared with logistic regression [<xref ref-type="bibr" rid="ref18">18</xref>] and previous models for targeted identification of lung cancer risk factors [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref36">36</xref>-<xref ref-type="bibr" rid="ref40">40</xref>].</p>
        <p>In recent years, the deep learning method has been applied more frequently in lung cancer detection and prediction due to its advantages of high accuracy and fast computing speed. Hosny and colleagues used deep learning networks to predict mortality risk stratification of patients with NSCLC [<xref ref-type="bibr" rid="ref22">22</xref>]. Cha and colleagues found that a deep learning method had high diagnostic performance in detecting operable lung cancer with chest radiographs [<xref ref-type="bibr" rid="ref20">20</xref>]. The DNN model, which we proposed to extract risk factors, could also be applied to provide intervention indicators for lung cancer prevention and carry out targeted intervention measures.</p>
        <p>Through integrating multidisciplinary data, we employed the DNN method to identify key lung cancer risk factors in the elderly. We computed quantitative weights of different risk factors in a stratified population to deduce their degrees of influence on lung cancer incidence. Our results showed that DNN models identified specific risk factors of targeted elderly people. People who were 65 years or older were more sensitive to time since quitting and smoking frequency, especially in men in this age group: smoking frequency was the leading causative risk factor for lung cancer in men 65 years and older. Time since quitting and smoking at least 100 cigarettes over a lifetime were the main risk factors for lung cancer in women 65 years and older. Men 65 years and older had the highest lung cancer incidence in these stratified groups. Lung cancer incidence decreased more obviously in men than in women with a decline in smoking rate. Cancer history played an important role in the incidence of lung cancer. Taking part in more physical activities to enhance physical quality might reduce lung cancer incidence [<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref42">42</xref>]. Smoking-related factors (eg, smoking frequency, time since quitting, smoking at least 100 cigarettes) were important risk factors for lung cancer in elderly patients. Risk factors such as smoking-related factors, exercise, and cancer history were intervention indicators in preventing lung cancer. Tammemagi and colleagues found that smokers aged 65 to 80 years were a high-risk group who might benefit from low-dose CT lung cancer screening [<xref ref-type="bibr" rid="ref43">43</xref>]. Chen and colleagues found that regional application of effective primary cancer prevention strategies on smoking, poor diet, and other modifiable risk factors had a vast potential to reduce the burden of cancer and disparities in China [<xref ref-type="bibr" rid="ref9">9</xref>]. 
These findings suggest that interventional measures targeting the main risk factors might help prevent lung cancer occurrence.</p>
      </sec>
      <sec>
        <title>Comparison With Prior Work</title>
        <p>Previously, researchers developed several models to identify lung cancer risk factors [<xref ref-type="bibr" rid="ref36">36</xref>-<xref ref-type="bibr" rid="ref40">40</xref>]. <xref ref-type="table" rid="table4">Table 4</xref> shows a comparison of our model with previous models. Compared with previous models, our proposed model identified risk factors for lung cancer in the elderly with high accuracy and AUROC. Our model used data from a larger population, more lung cancer occurrence-related risk factors, and a more efficient identification algorithm than previous models. Our DNN models had faster training speeds than previous models when training on the same scale of big data, which could save a lot of time. Moreover, we balanced and preprocessed the data before training the DNN models, which was helpful to improve model accuracy effectively.</p>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Comparison of our model with previous models for identifying lung cancer risk factors.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="150"/>
            <col width="90"/>
            <col width="170"/>
            <col width="410"/>
            <col width="90"/>
            <col width="90"/>
            <thead>
              <tr valign="bottom">
                <td>Model</td>
                <td>Population</td>
                <td>Method</td>
                <td>Risk factors</td>
                <td>Accuracy</td>
                <td>AUROC<sup>a</sup></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Our model</td>
                <td>235,673</td>
                <td>Deep neural network</td>
                <td>As listed in the Results section</td>
                <td>0.927</td>
                <td>0.913</td>
              </tr>
              <tr valign="top">
                <td>Panayiotis, 2016 [<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                <td>25,486</td>
                <td>Dynamic Bayesian network</td>
                <td>Demographics, smoking status, family history of cancer, cancer history, comorbidities related to lung cancer, occupational exposures, and low-dose computed tomography screening outcomes</td>
                <td>0.65</td>
                <td>0.75</td>
              </tr>
              <tr valign="top">
                <td>Wang, 2019 [<xref ref-type="bibr" rid="ref37">37</xref>]</td>
                <td>961</td>
                <td>Conditional Gaussian Bayesian network</td>
                <td>Age, sex, level of education, region, urbanization, diagnosis-based factors, prior utilization factors, prescription factors</td>
                <td>0.67</td>
                <td>N/A<sup>b</sup></td>
              </tr>
              <tr valign="top">
                <td>Ankit, 2012 [<xref ref-type="bibr" rid="ref38">38</xref>]</td>
                <td>70,132</td>
                <td>Decision tree</td>
                <td>Age, birthplace, cancer grade, diagnostic confirmation, farthest extension of tumor, type of surgery performed, reason for no surgery, order of surgery and radiation therapy, scope of regional lymph node surgery</td>
                <td>0.863</td>
                <td>0.91</td>
              </tr>
              <tr valign="top">
                <td>Xie, 2014 [<xref ref-type="bibr" rid="ref39">39</xref>]</td>
                <td>1703</td>
                <td>Artificial neural network</td>
                <td>41 risk factors: age, education level, marital status, income status, smoking, alcohol drinking, coffee intake, etc</td>
                <td>0.838</td>
                <td>N/A</td>
              </tr>
              <tr valign="top">
                <td>Kaviarasi, 2019 [<xref ref-type="bibr" rid="ref40">40</xref>]</td>
                <td>321</td>
                <td>Gaussian classifier</td>
                <td>Age, sex, radiation sequence with surgery, first malignant primary indicator, radiation, etc</td>
                <td>N/A</td>
                <td>0.881</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup>AUROC: area under the receiver operating characteristic curve.</p>
            </fn>
            <fn id="table4fn2">
              <p><sup>b</sup>Not available.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>Some aspects of our results were similar to the results of these previous studies. In our results, smoking was the leading cause of lung cancer in the elderly. This view was consistent with the reported literature [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref44">44</xref>-<xref ref-type="bibr" rid="ref46">46</xref>]. Nevertheless, we focused on some original findings in stratified groups of older people.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>This study had several limitations. First, we mainly focused on modifiable risk factors of lung cancer in the elderly. In the future, we should validate these identified modifiable risk factors using a simulated intervention process to prevent lung cancer. Second, because we used open survey data, we did not obtain the participants’ genetic and dietary factors. We are currently matching the data to source regions, and we will analyze lung cancer risk factors by region in the future.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>This study demonstrated a quantitative method to identify risk factors for lung cancer in the elderly. The proposed models provided intervention indicators to prevent lung cancer, especially in older men, which could be used with effective intervention methods to reduce lung cancer incidence in the elderly and improve their quality of life in their later years. This approach might be used as a risk factor identification tool in other cancers and help physicians make decisions on cancer prevention.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AUROC</term>
          <def>
            <p>area under the receiver operating characteristic curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">BRFSS</term>
          <def>
            <p>Behavioral Risk Factor Surveillance System</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">Caffe</term>
          <def>
            <p>Convolutional Architecture for Fast Feature Embedding</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">CAT</term>
          <def>
            <p>computerized axial tomography</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">COPD</term>
          <def>
            <p>chronic obstructive pulmonary disease</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">CT</term>
          <def>
            <p>computed tomography</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">DNN</term>
          <def>
            <p>deep neural network</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">HDF5</term>
          <def>
            <p>hierarchical data format version 5</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">NSCLC</term>
          <def>
            <p>non–small cell lung cancer</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">SMOTE</term>
          <def>
            <p>synthetic minority oversampling technique</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This study was supported by the General Project on Humanities and Social Science Research of the Ministry of Education of China under grant no 19YJC870002, the National Key R&#38;D Program of China under grant no 2016YFC0901602, and the Medical and Health Technology Innovation Project of the Chinese Academy of Medical Sciences under grant no 2019-I2M-2-002.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>U.S. National Library of Medicine</collab>
          </person-group>
          <source>MedlinePlus. Non-small cell lung cancer</source>
          <year>2019</year>
          <access-date>2019-06-20</access-date>
          <publisher-loc>Bethesda, MD</publisher-loc>
          <publisher-name>U.S. Department of Health and Human Services, National Institutes of Health</publisher-name>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medlineplus.gov/ency/article/007194.htm">https://medlineplus.gov/ency/article/007194.htm</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schuller</surname>
              <given-names>HM</given-names>
            </name>
          </person-group>
          <article-title>The impact of smoking and the influence of other factors on lung cancer</article-title>
          <source>Expert Rev Respir Med</source>
          <year>2019</year>
          <month>08</month>
          <volume>13</volume>
          <issue>8</issue>
          <fpage>761</fpage>
          <lpage>769</lpage>
          <pub-id pub-id-type="doi">10.1080/17476348.2019.1645010</pub-id>
          <pub-id pub-id-type="medline">31311354</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Park</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Cho</surname>
              <given-names>LY</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>SH</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Yoo</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>C</given-names>
            </name>
            <collab>Scientific Committee, Korean Academy of Tuberculosis and Respiratory Diseases</collab>
          </person-group>
          <article-title>Lung cancer risk and cigarette smoking, lung tuberculosis according to histologic type and gender in a population based case-control study</article-title>
          <source>Lung Cancer</source>
          <year>2010</year>
          <month>04</month>
          <volume>68</volume>
          <issue>1</issue>
          <fpage>20</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.1016/j.lungcan.2009.05.017</pub-id>
          <pub-id pub-id-type="medline">19545930</pub-id>
          <pub-id pub-id-type="pii">S0169-5002(09)00318-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hahn</surname>
              <given-names>EJ</given-names>
            </name>
            <name name-style="western">
              <surname>Hooper</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Riker</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Butler</surname>
              <given-names>KM</given-names>
            </name>
            <name name-style="western">
              <surname>Rademacher</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Wiggins</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rayens</surname>
              <given-names>MK</given-names>
            </name>
          </person-group>
          <article-title>Lung cancer worry and home screening for radon and secondhand smoke in renters</article-title>
          <source>J Environ Health</source>
          <year>2017</year>
          <volume>79</volume>
          <issue>6</issue>
          <fpage>8</fpage>
          <lpage>13</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29135198"/>
          </comment>
          <pub-id pub-id-type="medline">29135198</pub-id>
          <pub-id pub-id-type="pmcid">PMC5754926</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Deng</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Fan</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>An evidence-based assessment for the association between long-term exposure to outdoor air pollution and the risk of lung cancer</article-title>
          <source>Eur J Cancer Prev</source>
          <year>2016</year>
          <month>05</month>
          <volume>25</volume>
          <issue>3</issue>
          <fpage>163</fpage>
          <lpage>72</lpage>
          <pub-id pub-id-type="doi">10.1097/CEJ.0000000000000158</pub-id>
          <pub-id pub-id-type="medline">25757194</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lamm</surname>
              <given-names>SH</given-names>
            </name>
            <name name-style="western">
              <surname>Boroje</surname>
              <given-names>IJ</given-names>
            </name>
            <name name-style="western">
              <surname>Ferdosi</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Ahn</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Lung cancer risk and low (≤50 μg/L) drinking water arsenic levels for US counties (2009-2013)-a negative association</article-title>
          <source>Int J Environ Res Public Health</source>
          <year>2018</year>
          <month>06</month>
          <day>07</day>
          <volume>15</volume>
          <issue>6</issue>
          <fpage>1</fpage>
          <lpage>21</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.mdpi.com/resolver?pii=ijerph15061200"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/ijerph15061200</pub-id>
          <pub-id pub-id-type="medline">29880761</pub-id>
          <pub-id pub-id-type="pii">ijerph15061200</pub-id>
          <pub-id pub-id-type="pmcid">PMC6025287</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chiu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Tsai</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Calcium and magnesium in drinking-water and risk of death from lung cancer in women</article-title>
          <source>Magnes Res</source>
          <year>2012</year>
          <volume>25</volume>
          <issue>3</issue>
          <fpage>112</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.jle.com/medline.md?issn=0953-1424&#38;vol=25&#38;iss=3&#38;page=112"/>
          </comment>
          <pub-id pub-id-type="doi">10.1684/mrh.2012.0318</pub-id>
          <pub-id pub-id-type="medline">23073359</pub-id>
          <pub-id pub-id-type="pii">mrh.2012.0318</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Allemani</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Matsuda</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Di Carlo</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Harewood</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Matz</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Nikšić</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bonaventure</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Valkov</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Estève</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ogunbiyi</surname>
              <given-names>OJ</given-names>
            </name>
            <name name-style="western">
              <surname>Azevedo E Silva</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Eser</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Engholm</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Stiller</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Monnereau</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Woods</surname>
              <given-names>RR</given-names>
            </name>
            <name name-style="western">
              <surname>Visser</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Lim</surname>
              <given-names>GH</given-names>
            </name>
            <name name-style="western">
              <surname>Aitken</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Weir</surname>
              <given-names>HK</given-names>
            </name>
            <name name-style="western">
              <surname>Coleman</surname>
              <given-names>MP</given-names>
            </name>
            <collab>CONCORD Working Group</collab>
          </person-group>
          <article-title>Global surveillance of trends in cancer survival 2000-14 (CONCORD-3): analysis of individual records for 37 513 025 patients diagnosed with one of 18 cancers from 322 population-based registries in 71 countries</article-title>
          <source>Lancet</source>
          <year>2018</year>
          <month>03</month>
          <day>17</day>
          <volume>391</volume>
          <issue>10125</issue>
          <fpage>1023</fpage>
          <lpage>1075</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29395269"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S0140-6736(17)33326-3</pub-id>
          <pub-id pub-id-type="medline">29395269</pub-id>
          <pub-id pub-id-type="pii">S0140-6736(17)33326-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC5879496</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Xia</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Brown</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Islami</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Bray</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Jemal</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Disparities by province, age, and sex in site-specific cancer burden attributable to 23 potentially modifiable risk factors in China: a comparative risk assessment</article-title>
          <source>Lancet Glob Health</source>
          <year>2019</year>
          <month>02</month>
          <volume>7</volume>
          <issue>2</issue>
          <fpage>e257</fpage>
          <lpage>e269</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2214-109X(18)30488-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S2214-109X(18)30488-1</pub-id>
          <pub-id pub-id-type="medline">30683243</pub-id>
          <pub-id pub-id-type="pii">S2214-109X(18)30488-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lobach</surname>
              <given-names>DF</given-names>
            </name>
            <name name-style="western">
              <surname>Johns</surname>
              <given-names>EB</given-names>
            </name>
            <name name-style="western">
              <surname>Halpenny</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Saunders</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Brzozowski</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Del Fiol</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Berry</surname>
              <given-names>DL</given-names>
            </name>
            <name name-style="western">
              <surname>Braun</surname>
              <given-names>IM</given-names>
            </name>
            <name name-style="western">
              <surname>Finn</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Wolfe</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Abrahm</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Cooley</surname>
              <given-names>ME</given-names>
            </name>
          </person-group>
          <article-title>Increasing complexity in rule-based clinical decision support: the symptom assessment and management intervention</article-title>
          <source>JMIR Med Inform</source>
          <year>2016</year>
          <month>11</month>
          <day>08</day>
          <volume>4</volume>
          <issue>4</issue>
          <fpage>e36</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://medinform.jmir.org/2016/4/e36/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/medinform.5728</pub-id>
          <pub-id pub-id-type="medline">27826132</pub-id>
          <pub-id pub-id-type="pii">v4i4e36</pub-id>
          <pub-id pub-id-type="pmcid">PMC5120240</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <collab>National Lung Screening Trial Research Team</collab>
            <name name-style="western">
              <surname>Aberle</surname>
              <given-names>DR</given-names>
            </name>
            <name name-style="western">
              <surname>Adams</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Berg</surname>
              <given-names>CD</given-names>
            </name>
            <name name-style="western">
              <surname>Black</surname>
              <given-names>WC</given-names>
            </name>
            <name name-style="western">
              <surname>Clapp</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Fagerstrom</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Gareen</surname>
              <given-names>IF</given-names>
            </name>
            <name name-style="western">
              <surname>Gatsonis</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Marcus</surname>
              <given-names>PM</given-names>
            </name>
            <name name-style="western">
              <surname>Sicks</surname>
              <given-names>JD</given-names>
            </name>
          </person-group>
          <article-title>Reduced lung-cancer mortality with low-dose computed tomographic screening</article-title>
          <source>N Engl J Med</source>
          <year>2011</year>
          <month>08</month>
          <day>04</day>
          <volume>365</volume>
          <issue>5</issue>
          <fpage>395</fpage>
          <lpage>409</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21714641"/>
          </comment>
          <pub-id pub-id-type="doi">10.1056/NEJMoa1102873</pub-id>
          <pub-id pub-id-type="medline">21714641</pub-id>
          <pub-id pub-id-type="pmcid">PMC4356534</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zahnd</surname>
              <given-names>WE</given-names>
            </name>
            <name name-style="western">
              <surname>Eberth</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>Lung cancer screening utilization: a behavioral risk factor surveillance system analysis</article-title>
          <source>Am J Prev Med</source>
          <year>2019</year>
          <month>08</month>
          <volume>57</volume>
          <issue>2</issue>
          <fpage>250</fpage>
          <lpage>255</lpage>
          <pub-id pub-id-type="doi">10.1016/j.amepre.2019.03.015</pub-id>
          <pub-id pub-id-type="medline">31248742</pub-id>
          <pub-id pub-id-type="pii">S0749-3797(19)30165-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Moyer</surname>
              <given-names>VA</given-names>
            </name>
            <collab>U.S. Preventive Services Task Force</collab>
          </person-group>
          <article-title>Screening for lung cancer: U.S. Preventive Services Task Force recommendation statement</article-title>
          <source>Ann Intern Med</source>
          <year>2014</year>
          <month>03</month>
          <day>04</day>
          <volume>160</volume>
          <issue>5</issue>
          <fpage>330</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.7326/M13-2771</pub-id>
          <pub-id pub-id-type="medline">24378917</pub-id>
          <pub-id pub-id-type="pii">1809422</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Berkowitz</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Richards</surname>
              <given-names>TB</given-names>
            </name>
            <name name-style="western">
              <surname>Peipins</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Henley</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Holt</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Multilevel small-area estimation of multiple cigarette smoking status categories using the 2012 Behavioral Risk Factor Surveillance System</article-title>
          <source>Cancer Epidemiol Biomarkers Prev</source>
          <year>2016</year>
          <month>10</month>
          <volume>25</volume>
          <issue>10</issue>
          <fpage>1402</fpage>
          <lpage>1410</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://cebp.aacrjournals.org/cgi/pmidlookup?view=long&#38;pmid=27697795"/>
          </comment>
          <pub-id pub-id-type="doi">10.1158/1055-9965.EPI-16-0244</pub-id>
          <pub-id pub-id-type="medline">27697795</pub-id>
          <pub-id pub-id-type="pii">1055-9965.EPI-16-0244</pub-id>
          <pub-id pub-id-type="pmcid">PMC6369521</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Luna</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Chao</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Diffenderfer</surname>
              <given-names>ES</given-names>
            </name>
            <name name-style="western">
              <surname>Valdes</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Chinniah</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Cengel</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Solberg</surname>
              <given-names>TD</given-names>
            </name>
            <name name-style="western">
              <surname>Berman</surname>
              <given-names>AT</given-names>
            </name>
            <name name-style="western">
              <surname>Simone</surname>
              <given-names>CB</given-names>
            </name>
          </person-group>
          <article-title>Predicting radiation pneumonitis in locally advanced stage II-III non-small cell lung cancer using machine learning</article-title>
          <source>Radiother Oncol</source>
          <year>2019</year>
          <month>04</month>
          <volume>133</volume>
          <fpage>106</fpage>
          <lpage>112</lpage>
          <pub-id pub-id-type="doi">10.1016/j.radonc.2019.01.003</pub-id>
          <pub-id pub-id-type="medline">30935565</pub-id>
          <pub-id pub-id-type="pii">S0167-8140(19)30007-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Palani</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Venkatalakshmi</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>An IoT based predictive modelling for predicting lung cancer using fuzzy cluster based segmentation and classification</article-title>
          <source>J Med Syst</source>
          <year>2018</year>
          <month>12</month>
          <day>18</day>
          <volume>43</volume>
          <issue>2</issue>
          <fpage>21</fpage>
          <pub-id pub-id-type="doi">10.1007/s10916-018-1139-7</pub-id>
          <pub-id pub-id-type="medline">30564924</pub-id>
          <pub-id pub-id-type="pii">10.1007/s10916-018-1139-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ahmed</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Emran</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Jesmin</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Mukti</surname>
              <given-names>RF</given-names>
            </name>
            <name name-style="western">
              <surname>Rahman</surname>
              <given-names>MZ</given-names>
            </name>
            <name name-style="western">
              <surname>Ahmed</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Early detection of lung cancer risk using data mining</article-title>
          <source>Asian Pac J Cancer Prev</source>
          <year>2013</year>
          <volume>14</volume>
          <issue>1</issue>
          <fpage>595</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://journal.waocp.org/?sid=Entrez:PubMed&#38;id=pmid:23534801&#38;key=2013.14.1.595"/>
          </comment>
          <pub-id pub-id-type="doi">10.7314/apjcp.2013.14.1.595</pub-id>
          <pub-id pub-id-type="medline">23534801</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Pleasants</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Croft</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Lugogo</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Ohar</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Heidari</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Strange</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wheaton</surname>
              <given-names>AG</given-names>
            </name>
            <name name-style="western">
              <surname>Mannino</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Kraft</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Body mass index, respiratory conditions, asthma, and chronic obstructive pulmonary disease</article-title>
          <source>Respir Med</source>
          <year>2015</year>
          <month>07</month>
          <volume>109</volume>
          <issue>7</issue>
          <fpage>851</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0954-6111(15)00176-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.rmed.2015.05.006</pub-id>
          <pub-id pub-id-type="medline">26006753</pub-id>
          <pub-id pub-id-type="pii">S0954-6111(15)00176-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC4487766</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lynch</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Abdollahi</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Fuqua</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>de Carlo</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>Bartholomai</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Balgemann</surname>
              <given-names>RN</given-names>
            </name>
            <name name-style="western">
              <surname>van Berkel</surname>
              <given-names>VH</given-names>
            </name>
            <name name-style="western">
              <surname>Frieboes</surname>
              <given-names>HB</given-names>
            </name>
          </person-group>
          <article-title>Prediction of lung cancer patient survival via supervised machine learning classification techniques</article-title>
          <source>Int J Med Inform</source>
          <year>2017</year>
          <month>12</month>
          <volume>108</volume>
          <fpage>1</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29132615"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2017.09.013</pub-id>
          <pub-id pub-id-type="medline">29132615</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(17)30236-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC5726571</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cha</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Chung</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>KS</given-names>
            </name>
          </person-group>
          <article-title>Performance of deep learning model in detecting operable lung cancer with chest radiographs</article-title>
          <source>J Thorac Imaging</source>
          <year>2019</year>
          <month>03</month>
          <volume>34</volume>
          <issue>2</issue>
          <fpage>86</fpage>
          <lpage>91</lpage>
          <pub-id pub-id-type="doi">10.1097/RTI.0000000000000388</pub-id>
          <pub-id pub-id-type="medline">30802232</pub-id>
          <pub-id pub-id-type="pii">00005382-201903000-00003</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schwyzer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ferraro</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Muehlematter</surname>
              <given-names>UJ</given-names>
            </name>
            <name name-style="western">
              <surname>Curioni-Fontecedro</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Huellner</surname>
              <given-names>MW</given-names>
            </name>
            <name name-style="western">
              <surname>von Schulthess</surname>
              <given-names>GK</given-names>
            </name>
            <name name-style="western">
              <surname>Kaufmann</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Burger</surname>
              <given-names>IA</given-names>
            </name>
            <name name-style="western">
              <surname>Messerli</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Automated detection of lung cancer at ultralow dose PET/CT by deep neural networks - initial results</article-title>
          <source>Lung Cancer</source>
          <year>2018</year>
          <month>12</month>
          <volume>126</volume>
          <fpage>170</fpage>
          <lpage>173</lpage>
          <pub-id pub-id-type="doi">10.1016/j.lungcan.2018.11.001</pub-id>
          <pub-id pub-id-type="medline">30527183</pub-id>
          <pub-id pub-id-type="pii">S0169-5002(18)30628-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hosny</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Parmar</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Coroller</surname>
              <given-names>TP</given-names>
            </name>
            <name name-style="western">
              <surname>Grossmann</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Zeleznik</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Kumar</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bussink</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Gillies</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Mak</surname>
              <given-names>RH</given-names>
            </name>
            <name name-style="western">
              <surname>Aerts</surname>
              <given-names>HJWL</given-names>
            </name>
          </person-group>
          <article-title>Deep learning for lung cancer prognostication: a retrospective multi-cohort radiomics study</article-title>
          <source>PLoS Med</source>
          <year>2018</year>
          <month>11</month>
          <volume>15</volume>
          <issue>11</issue>
          <fpage>e1002711</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pmed.1002711"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pmed.1002711</pub-id>
          <pub-id pub-id-type="medline">30500819</pub-id>
          <pub-id pub-id-type="pii">PMEDICINE-D-18-01161</pub-id>
          <pub-id pub-id-type="pmcid">PMC6269088</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>US Centers for Disease Control and Prevention</collab>
          </person-group>
          <source>Behavioral Risk Factor Surveillance System</source>
          <year>2019</year>
          <access-date>2020-01-27</access-date>
          <publisher-name>U.S. Department of Health &#38; Human Services</publisher-name>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cdc.gov/brfss/">https://www.cdc.gov/brfss/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>United States Environmental Protection Agency</collab>
          </person-group>
          <source>Environmental Data database</source>
          <year>2019</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.epa.gov/">https://www.epa.gov/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Samet</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Avila-Tang</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Boffetta</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Hannan</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Olivo-Marston</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Thun</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Rudin</surname>
              <given-names>CM</given-names>
            </name>
          </person-group>
          <article-title>Lung cancer in never smokers: clinical epidemiology and environmental risk factors</article-title>
          <source>Clin Cancer Res</source>
          <year>2009</year>
          <month>09</month>
          <day>15</day>
          <volume>15</volume>
          <issue>18</issue>
          <fpage>5626</fpage>
          <lpage>45</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://clincancerres.aacrjournals.org/cgi/pmidlookup?view=long&#38;pmid=19755391"/>
          </comment>
          <pub-id pub-id-type="doi">10.1158/1078-0432.CCR-09-0376</pub-id>
          <pub-id pub-id-type="medline">19755391</pub-id>
          <pub-id pub-id-type="pii">15/18/5626</pub-id>
          <pub-id pub-id-type="pmcid">PMC3170525</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Molina</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Cassivi</surname>
              <given-names>SD</given-names>
            </name>
            <name name-style="western">
              <surname>Schild</surname>
              <given-names>SE</given-names>
            </name>
            <name name-style="western">
              <surname>Adjei</surname>
              <given-names>AA</given-names>
            </name>
          </person-group>
          <article-title>Non-small cell lung cancer: epidemiology, risk factors, treatment, and survivorship</article-title>
          <source>Mayo Clin Proc</source>
          <year>2008</year>
          <month>05</month>
          <volume>83</volume>
          <issue>5</issue>
          <fpage>584</fpage>
          <lpage>94</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/18452692"/>
          </comment>
          <pub-id pub-id-type="doi">10.4065/83.5.584</pub-id>
          <pub-id pub-id-type="medline">18452692</pub-id>
          <pub-id pub-id-type="pii">S0025-6196(11)60735-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC2718421</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Jabbour</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>O'Reilly</surname>
              <given-names>SE</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Dong</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ding</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Xiao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yue</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Zou</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Automated information extraction on treatment and prognosis for non-small cell lung cancer radiotherapy patients: clinical study</article-title>
          <source>JMIR Med Inform</source>
          <year>2018</year>
          <month>02</month>
          <day>01</day>
          <volume>6</volume>
          <issue>1</issue>
          <fpage>e8</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2018/1/e8/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/medinform.8662</pub-id>
          <pub-id pub-id-type="medline">29391345</pub-id>
          <pub-id pub-id-type="pii">v6i1e8</pub-id>
          <pub-id pub-id-type="pmcid">PMC5814605</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Im</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>HY</given-names>
            </name>
            <name name-style="western">
              <surname>Shin</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Shin</surname>
              <given-names>SH</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Ahn</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Sohn</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Cho</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>HK</given-names>
            </name>
            <name name-style="western">
              <surname>Zo</surname>
              <given-names>JI</given-names>
            </name>
            <name name-style="western">
              <surname>Shim</surname>
              <given-names>YM</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>HY</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Prevalence of and risk factors for pulmonary complications after curative resection in otherwise healthy elderly patients with early stage lung cancer</article-title>
          <source>Respir Res</source>
          <year>2019</year>
          <month>07</month>
          <day>04</day>
          <volume>20</volume>
          <issue>1</issue>
          <fpage>136</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://respiratory-research.biomedcentral.com/articles/10.1186/s12931-019-1087-x"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12931-019-1087-x</pub-id>
          <pub-id pub-id-type="medline">31272446</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12931-019-1087-x</pub-id>
          <pub-id pub-id-type="pmcid">PMC6610954</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chawla</surname>
              <given-names>NV</given-names>
            </name>
            <name name-style="western">
              <surname>Bowyer</surname>
              <given-names>KW</given-names>
            </name>
            <name name-style="western">
              <surname>Hall</surname>
              <given-names>LO</given-names>
            </name>
            <name name-style="western">
              <surname>Kegelmeyer</surname>
              <given-names>WP</given-names>
            </name>
          </person-group>
          <article-title>SMOTE: synthetic minority over-sampling technique</article-title>
          <source>J Artif Intell Res</source>
          <year>2002</year>
          <month>06</month>
          <day>01</day>
          <volume>16</volume>
          <issue>6</issue>
          <fpage>321</fpage>
          <lpage>357</lpage>
          <pub-id pub-id-type="doi">10.1613/jair.953</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schafer</surname>
              <given-names>JL</given-names>
            </name>
          </person-group>
          <article-title>Multiple imputation: a primer</article-title>
          <source>Stat Methods Med Res</source>
          <year>1999</year>
          <month>03</month>
          <volume>8</volume>
          <issue>1</issue>
          <fpage>3</fpage>
          <lpage>15</lpage>
          <pub-id pub-id-type="medline">10347857</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kalman</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>A singularly valuable decomposition: the SVD of a matrix</article-title>
          <source>Coll Math J</source>
          <year>1996</year>
          <month>01</month>
          <volume>27</volume>
          <issue>1</issue>
          <fpage>2</fpage>
          <lpage>23</lpage>
          <pub-id pub-id-type="doi">10.2307/2687269</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>The HDF group</collab>
          </person-group>
          <source>HDF5 format</source>
          <year>2019</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://support.hdfgroup.org/HDF5/">https://support.hdfgroup.org/HDF5/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>Caffe</collab>
          </person-group>
          <source>Caffe deep learning framework</source>
          <year>2019</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://caffe.berkeleyvision.org/">http://caffe.berkeleyvision.org/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jatoi</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Anderson</surname>
              <given-names>WF</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>AB</given-names>
            </name>
            <name name-style="western">
              <surname>Brawley</surname>
              <given-names>OW</given-names>
            </name>
          </person-group>
          <article-title>The history of cancer screening</article-title>
          <source>Curr Probl Surg</source>
          <year>2019</year>
          <month>04</month>
          <volume>56</volume>
          <issue>4</issue>
          <fpage>138</fpage>
          <lpage>163</lpage>
          <pub-id pub-id-type="doi">10.1067/j.cpsurg.2018.12.006</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Qiu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Fang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Hou</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Impact of prior cancer history on the overall survival of patients newly diagnosed with cancer: a pan-cancer analysis of the SEER database</article-title>
          <source>Int J Cancer</source>
          <year>2018</year>
          <month>10</month>
          <day>01</day>
          <volume>143</volume>
          <issue>7</issue>
          <fpage>1569</fpage>
          <lpage>1577</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1002/ijc.31543"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/ijc.31543</pub-id>
          <pub-id pub-id-type="medline">29667174</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Petousis</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Han</surname>
              <given-names>SX</given-names>
            </name>
            <name name-style="western">
              <surname>Aberle</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Bui</surname>
              <given-names>AAT</given-names>
            </name>
          </person-group>
          <article-title>Prediction of lung cancer incidence on the low-dose computed tomography arm of the National Lung Screening Trial: a dynamic Bayesian network</article-title>
          <source>Artif Intell Med</source>
          <year>2016</year>
          <month>09</month>
          <volume>72</volume>
          <fpage>42</fpage>
          <lpage>55</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/27664507"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.artmed.2016.07.001</pub-id>
          <pub-id pub-id-type="medline">27664507</pub-id>
          <pub-id pub-id-type="pii">S0933-3657(16)30106-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC5082434</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Medical expenditure estimation by Bayesian network for lung cancer patients at different severity stages</article-title>
          <source>Comput Biol Med</source>
          <year>2019</year>
          <month>03</month>
          <volume>106</volume>
          <fpage>97</fpage>
          <lpage>105</lpage>
          <pub-id pub-id-type="doi">10.1016/j.compbiomed.2019.01.015</pub-id>
          <pub-id pub-id-type="medline">30708222</pub-id>
          <pub-id pub-id-type="pii">S0010-4825(19)30017-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Agrawal</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Misra</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Narayanan</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Polepeddi</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Choudhary</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Lung cancer survival prediction using ensemble data mining on SEER data</article-title>
          <source>Sci Program</source>
          <year>2012</year>
          <volume>20</volume>
          <issue>1</issue>
          <fpage>29</fpage>
          <lpage>42</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.3233/SPR-2012-0335"/>
          </comment>
          <pub-id pub-id-type="doi">10.3233/SPR-2012-0335</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Lung cancer risk prediction method based on feature selection and artificial neural network</article-title>
          <source>Asian Pac J Cancer Prev</source>
          <year>2014</year>
          <volume>15</volume>
          <issue>23</issue>
          <fpage>10539</fpage>
          <lpage>42</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://journal.waocp.org/?sid=Entrez:PubMed&#38;id=pmid:25556505&#38;key=2014.15.23.10539"/>
          </comment>
          <pub-id pub-id-type="doi">10.7314/apjcp.2014.15.23.10539</pub-id>
          <pub-id pub-id-type="medline">25556505</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kaviarasi</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Gandhi</surname>
              <given-names>RR</given-names>
            </name>
          </person-group>
          <article-title>Accuracy enhanced lung cancer prognosis for improving patient survivability using proposed Gaussian classifier system</article-title>
          <source>J Med Syst</source>
          <year>2019</year>
          <month>05</month>
          <day>24</day>
          <volume>43</volume>
          <issue>7</issue>
          <fpage>201</fpage>
          <pub-id pub-id-type="doi">10.1007/s10916-019-1297-2</pub-id>
          <pub-id pub-id-type="medline">31127444</pub-id>
          <pub-id pub-id-type="pii">10.1007/s10916-019-1297-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Granger</surname>
              <given-names>CL</given-names>
            </name>
            <name name-style="western">
              <surname>McDonald</surname>
              <given-names>CF</given-names>
            </name>
            <name name-style="western">
              <surname>Berney</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chao</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Denehy</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Exercise intervention to improve exercise capacity and health related quality of life for patients with Non-small cell lung cancer: a systematic review</article-title>
          <source>Lung Cancer</source>
          <year>2011</year>
          <month>05</month>
          <volume>72</volume>
          <issue>2</issue>
          <fpage>139</fpage>
          <lpage>53</lpage>
          <pub-id pub-id-type="doi">10.1016/j.lungcan.2011.01.006</pub-id>
          <pub-id pub-id-type="medline">21316790</pub-id>
          <pub-id pub-id-type="pii">S0169-5002(11)00032-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Arbane</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Tropman</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Jackson</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Garrod</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Evaluation of an early exercise intervention after thoracotomy for non-small cell lung cancer (NSCLC), effects on quality of life, muscle strength and exercise tolerance: randomised controlled trial</article-title>
          <source>Lung Cancer</source>
          <year>2011</year>
          <month>02</month>
          <volume>71</volume>
          <issue>2</issue>
          <fpage>229</fpage>
          <lpage>34</lpage>
          <pub-id pub-id-type="doi">10.1016/j.lungcan.2010.04.025</pub-id>
          <pub-id pub-id-type="medline">20541832</pub-id>
          <pub-id pub-id-type="pii">S0169-5002(10)00215-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tammemägi</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>Church</surname>
              <given-names>TR</given-names>
            </name>
            <name name-style="western">
              <surname>Hocking</surname>
              <given-names>WG</given-names>
            </name>
            <name name-style="western">
              <surname>Silvestri</surname>
              <given-names>GA</given-names>
            </name>
            <name name-style="western">
              <surname>Kvale</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Riley</surname>
              <given-names>TL</given-names>
            </name>
            <name name-style="western">
              <surname>Commins</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Berg</surname>
              <given-names>CD</given-names>
            </name>
          </person-group>
          <article-title>Evaluation of the lung cancer risks at which to screen ever- and never-smokers: screening rules applied to the PLCO and NLST cohorts</article-title>
          <source>PLoS Med</source>
          <year>2014</year>
          <month>12</month>
          <volume>11</volume>
          <issue>12</issue>
          <fpage>e1001764</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pmed.1001764"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pmed.1001764</pub-id>
          <pub-id pub-id-type="medline">25460915</pub-id>
          <pub-id pub-id-type="pii">PMEDICINE-D-14-01117</pub-id>
          <pub-id pub-id-type="pmcid">PMC4251899</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>NL</given-names>
            </name>
            <name name-style="western">
              <surname>Wan</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Pathway-based identification of a smoking associated 6-gene signature predictive of lung cancer risk and survival</article-title>
          <source>Artif Intell Med</source>
          <year>2012</year>
          <month>06</month>
          <volume>55</volume>
          <issue>2</issue>
          <fpage>97</fpage>
          <lpage>105</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/22326768"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.artmed.2012.01.001</pub-id>
          <pub-id pub-id-type="medline">22326768</pub-id>
          <pub-id pub-id-type="pii">S0933-3657(12)00014-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC3351561</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Giuliani</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Dirlea</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Selby</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Papadakos</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Abdelmutti</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Eng</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Goldstein</surname>
              <given-names>DP</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>Implementation of a novel electronic patient-directed smoking cessation platform for cancer patients: interrupted time series analysis</article-title>
          <source>J Med Internet Res</source>
          <year>2019</year>
          <month>04</month>
          <day>09</day>
          <volume>21</volume>
          <issue>4</issue>
          <fpage>e11735</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2019/4/e11735/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/11735</pub-id>
          <pub-id pub-id-type="medline">30964445</pub-id>
          <pub-id pub-id-type="pii">v21i4e11735</pub-id>
          <pub-id pub-id-type="pmcid">PMC6477574</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wraith</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Mengersen</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Assessing the combined effect of asbestos exposure and smoking on lung cancer: a Bayesian approach</article-title>
          <source>Stat Med</source>
          <year>2007</year>
          <month>02</month>
          <day>28</day>
          <volume>26</volume>
          <issue>5</issue>
          <fpage>1150</fpage>
          <lpage>1169</lpage>
          <pub-id pub-id-type="doi">10.1002/sim.2602</pub-id>
          <pub-id pub-id-type="medline">16779874</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
