<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v22i4e15196</article-id>
      <article-id pub-id-type="pmid">32271154</article-id>
      <article-id pub-id-type="doi">10.2196/15196</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Epidemiological Characterization of a Directed and Weighted Disease Network Using Data From a Cohort of One Million Patients: Network Analysis</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Kolostoumpis</surname>
            <given-names>George</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Mavragani</surname>
            <given-names>Amaryllis</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Ko</surname>
            <given-names>Kyungmin</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5736-409X</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Lee</surname>
            <given-names>Chae Won</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9380-8230</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Nam</surname>
            <given-names>Sangmin</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6903-6333</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Ahn</surname>
            <given-names>Song Vogue</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2771-6792</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Bae</surname>
            <given-names>Jung Ho</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff6" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7669-1213</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Ban</surname>
            <given-names>Chi Yong</given-names>
          </name>
          <degrees>BA</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7269-4492</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Yoo</surname>
            <given-names>Jongman</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <xref rid="aff7" ref-type="aff">7</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4294-7051</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Park</surname>
            <given-names>Jungmin</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff8" ref-type="aff">8</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5837-2494</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Han</surname>
            <given-names>Hyun Wook</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Department of Biomedical Informatics</institution>
            <institution>CHA University of Medicine</institution>
            <addr-line>Pangyo-ro, 335</addr-line>
            <addr-line>Seongnam, KS009</addr-line>
            <country>Republic of Korea</country>
            <phone>82 31 881 7109</phone>
            <email>stepano7@gmail.com</email>
          </address>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6918-5694</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Department of Biomedical Informatics</institution>
        <institution>CHA University of Medicine</institution>
        <addr-line>Seongnam</addr-line>
        <country>Republic of Korea</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Pathology</institution>
        <institution>Medstar Georgetown University Hospital</institution>
        <addr-line>Washington, DC</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Institute of Basic Medical Sciences</institution>
        <institution>School of Medicine</institution>
        <institution>CHA University</institution>
        <addr-line>Seongnam</addr-line>
        <country>Republic of Korea</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Department of Ophthalmology</institution>
        <institution>CHA Bundang Medical Center</institution>
        <addr-line>Seongnam</addr-line>
        <country>Republic of Korea</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Department of Health Convergence</institution>
        <institution>Ewha Womans University</institution>
        <addr-line>Seoul</addr-line>
        <country>Republic of Korea</country>
      </aff>
      <aff id="aff6">
        <label>6</label>
        <institution>Department of Internal Medicine, Healthcare Research Institute</institution>
        <institution>Seoul National University Hospital Healthcare System Gangnam Center</institution>
        <addr-line>Seoul</addr-line>
        <country>Republic of Korea</country>
      </aff>
      <aff id="aff7">
        <label>7</label>
        <institution>Department of Microbiology</institution>
        <institution>CHA University School of Medicine</institution>
        <addr-line>Seongnam</addr-line>
        <country>Republic of Korea</country>
      </aff>
      <aff id="aff8">
        <label>8</label>
        <institution>Department of Nursing</institution>
        <institution>School of Nursing</institution>
        <institution>Hanyang University</institution>
        <addr-line>Seoul</addr-line>
        <country>Republic of Korea</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Hyun Wook Han <email>stepano7@gmail.com</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>4</month>
        <year>2020</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>9</day>
        <month>4</month>
        <year>2020</year>
      </pub-date>
      <volume>22</volume>
      <issue>4</issue>
      <elocation-id>e15196</elocation-id>
      <history>
        <date date-type="received">
          <day>28</day>
          <month>6</month>
          <year>2019</year>
        </date>
        <date date-type="rev-request">
          <day>14</day>
          <month>8</month>
          <year>2019</year>
        </date>
        <date date-type="rev-recd">
          <day>8</day>
          <month>10</month>
          <year>2019</year>
        </date>
        <date date-type="accepted">
          <day>24</day>
          <month>1</month>
          <year>2020</year>
        </date>
      </history>
      <copyright-statement>©Kyungmin Ko, Chae Won Lee, Sangmin Nam, Song Vogue Ahn, Jung Ho Bae, Chi Yong Ban, Jongman Yoo, Jungmin Park, Hyun Wook Han. Originally published in the Journal of Medical Internet Research (http://www.jmir.org), 09.04.2020.</copyright-statement>
      <copyright-year>2020</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on http://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2020/4/e15196" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>In the past 20 years, various methods have been introduced to construct disease networks. However, established disease networks have not been clinically useful to date because of differences among demographic factors, as well as the temporal order and intensity among disease-disease associations.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study sought to investigate the overall patterns of the associations among diseases; network properties, such as clustering, degree, and strength; and the relationship between the structure of disease networks and demographic factors.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We used National Health Insurance Service-National Sample Cohort (NHIS-NSC) data from the Republic of Korea, which included the time series insurance information of 1 million out of 50 million Korean (approximately 2%) patients obtained between 2002 and 2013. After setting the observation and outcome periods, we selected only 520 common Korean Classification of Disease, sixth revision codes that were the most prevalent diagnoses, making up approximately 80% of the cases, for statistical validity. Using these data, we constructed a directional and weighted temporal network that considered both demographic factors and network properties.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Our disease network contained 294 nodes and 3085 edges, a relative risk value of more than 4, and a false discovery rate-adjusted <italic>P</italic> value of &#60;.001. Interestingly, our network presented four large clusters. Analysis of the network topology revealed a stronger correlation between in-strength and out-strength than between in-degree and out-degree. Further, the mean age of each disease population was related to the position along the regression line of the out/in-strength plot. Conversely, clustering analysis suggested that our network boasted four large clusters with different sex, age, and disease categories.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>We constructed a directional and weighted disease network visualizing demographic factors. Our proposed disease network model is expected to be a valuable tool for use by early clinical researchers seeking to explore the relationships among diseases in the future.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>cohort studies</kwd>
        <kwd>data science</kwd>
        <kwd>longitudinal studies</kwd>
        <kwd>statistical data interpretation</kwd>
        <kwd>medical informatics</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Traditionally, clinical researchers have pushed forward to explore a number of risk factors that affect a single disease [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref3">3</xref>], and any diseases previously diagnosed are considered important clinical indicators to predict the disorder under investigation [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref5">5</xref>]. Among various methods for unearthing disease relationships, the concept of network medicine could be better suited to understand health and disease [<xref ref-type="bibr" rid="ref6">6</xref>-<xref ref-type="bibr" rid="ref8">8</xref>]. Likewise, a disease network was introduced a decade ago as a useful method to study the complex relationships among diseases [<xref ref-type="bibr" rid="ref9">9</xref>-<xref ref-type="bibr" rid="ref17">17</xref>].</p>
      <p>Under the assumption that diseases are caused by genetic defects, many disease networks were constructed using genomic data [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref14">14</xref>]. For example, Li et al constructed a network to investigate disease relationships according to the genes of their shared pathways [<xref ref-type="bibr" rid="ref14">14</xref>]. Nonetheless, according to the disease lists of the International Statistical Classification of Diseases, 10th revision (ICD-10), many diseases, such as traumatic bone fracture attributed to a traffic accident, are not related to genetic mutations. As such, genome-based disease networks alone are inevitably limited for accurately representing the complex pathogenesis of the relationships among diseases [<xref ref-type="bibr" rid="ref18">18</xref>].</p>
      <p>Thus, disease networks were later constructed using shared clinical information, such as symptoms and comorbidities [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref17">17</xref>]. Zhou et al generated a symptom-based network of human diseases that was based on the similarity of symptoms [<xref ref-type="bibr" rid="ref17">17</xref>], whereas Hidalgo et al and Barabási et al constructed a comorbidity network using the Medicare database [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref12">12</xref>]. Because these efforts were focused on demonstrating the relationships among shared diseases or symptoms occurring or present at a single point in time, the networks did not take into account investigations of the temporal order of disease manifestations [<xref ref-type="bibr" rid="ref19">19</xref>].</p>
      <p>Recently, researchers have suggested that disease networks should consider temporal directionality when exploring the connections among diseases [<xref ref-type="bibr" rid="ref13">13</xref>]. For instance, Jensen et al analyzed temporal disease progression patterns according to disease trajectory using the Danish National Patient Registry. In this study, we constructed a directional and weighted disease network visualizing the effects of demographic factors, such as sex, age, and disease outbreak size, according to the relative risk (RR) among diseases using the National Health Insurance Service-National Sample Cohort (NHIS-NSC) of South Korea, which includes epidemiological time series data of 12 years for approximately 1 million patients.</p>
      <p>Finally, we investigated the overall patterns of the associations among diseases; network properties, such as clustering, degree, and strength; and the relationship between the structure of the disease network and demographic factors.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Construction and Visualization of the Disease Network</title>
        <p>South Korea is a representative country implementing national health insurance services. The NHIS-NSC contains time series insurance information of 1 million out of 50 million Korean (approximately 2%) patients, which was collected between 2002 and 2013. Thus, clinical information can be tracked for 12 years for every patient.</p>
        <p>To examine the risk factors for diseases that a patient already had at the beginning of the cohort study, we needed to set an initial period before the main study period to serve as the medical history period. For most chronic diseases, the recommended follow-up interval rarely exceeds 2 years. Therefore, we set the observation period as 2002 through 2003 and the outcome period as 2004 through 2013.</p>
        <p>From the sample of 1,016,580 patients who were eligible for National Health Insurance in 2004, we selected 885,125 patients who had at least one record of a medical visit during the aforementioned observation period. We defined this group of patients as the sample cohort. In South Korea, diagnoses are coded in the Korean Classification of Diseases sixth revision (KCD-6), an extension of the ICD-10. The only difference between the KCD-6 and ICD-10 is that the diagnosis codes for Korean medicine are included in the KCD-6 using U20-U99 codes.</p>
        <p>To simplify the study, we truncated the KCD-6 codes beyond their third digit, in effect, grouping subcategories of conditions together. In total, the KCD-6, when used between 2002 and 2013, consisted of 2,097 unique diagnoses at the third digit level, and of these, 1,971 diagnoses were included in our data.</p>
        <p>Ultimately, we chose only 520 common KCD-6 codes that were the most prevalent diagnoses, covering approximately 80% of the cases for statistical validity.</p>
      </sec>
      <sec>
        <title>Statistical Analysis</title>
        <p>All statistical analyses and visualizations were performed using R (version 3.4.4) with the “igraph” package and Cytoscape. For calculation of the RR, we sought to obtain <italic>P</italic> values against the null hypothesis, which states that any two diseases occur independently of one another in the sample cohort. False-discovery rate (FDR) corrections were performed using the Benjamini-Hochberg method.</p>
        <p>Clusters of associated diseases were identified using the random walktrap community detection algorithm [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref21">21</xref>]. This method detects clusters purely according to connectivity (unless specified to use weights) using random walks along edges. The demographic profiling of disease clusters was carried out by pooling the patients identified with at least one of the diagnoses in the cluster.</p>
        <p>As a result, patient pools for each cluster are not exclusive but instead overlap somewhat with other clusters. The age distribution of the patient pools was calculated at the beginning of the observation period. An enrichment analysis of the clusters for the KCD categories was performed using the Fisher exact test for adjusted <italic>P</italic> values &#60;.05.</p>
      </sec>
      <sec>
        <title>Topological Characteristics of the Disease Network</title>
        <p>In graph theory, the degree of a node is the total number of connections with other nodes. In a directed network, the out-degree of a node is the number of connections with that node as the source, whereas the in-degree of a node is the number of connections with that node as the target. Hence, the degree can be thought of as a measure of the level of disease risk in our network.</p>
        <p>In contrast, the strength of a node is the sum of the RRs of its connections with other nodes. For example, the out-strength and in-strength of node <italic>i</italic> are defined, respectively, as follows:</p>
        <disp-formula>s<italic><sub>out</sub></italic> (<italic>i</italic>)=∑<italic><sub>j</sub></italic> RR<italic><sub>ij</sub></italic> (<bold>1</bold>)</disp-formula>
        <disp-formula>s<italic><sub>in</sub></italic> (<italic>i</italic>)=∑<italic><sub>j</sub></italic> RR<italic><sub>ji</sub></italic> (<bold>2</bold>)</disp-formula>
        <p>where <italic>RR<sub>ij</sub></italic> is the weight of the edge from node <italic>i</italic> to node <italic>j</italic>, and <italic>RR<sub>ji</sub></italic> is the weight of the edge from node <italic>j</italic> to node <italic>i</italic>. The out-strength is a measure of the magnitude of disease morbidity, whereas the in-strength is a measure of the magnitude of a disease’s tendency to follow from other diseases.</p>
      </sec>
      <sec>
        <title>Calculation of Relative Risk</title>
        <p>To calculate the risk ratio from a risk disease D<sub>1</sub> to an outcome disease D<sub>2</sub> (D<sub>1</sub>→D<sub>2</sub>), we need to first identify the group of patients at risk of acquiring D<sub>2</sub>. We regarded a patient as being at risk of disease D<sub>2</sub> if that patient had no record of being diagnosed with D<sub>2</sub> during the observation period. Patients were considered to be exposed if they had been diagnosed at least once with disease D<sub>1</sub> during the observation period. The RR of D<sub>1</sub>→ D<sub>2</sub> was defined using the following formula:</p>
        <disp-formula>RR=(a / [a + b]) / (c / [c + d]) (<bold>3</bold>)</disp-formula>
        <p>where a is the number of patients exposed to D<sub>1</sub> in the initial period and D<sub>2</sub> in the outcome period; b is the number of patients exposed to D<sub>1</sub> in the initial period but not exposed to D<sub>2</sub> in the outcome period; c is the number of patients not exposed to D<sub>1</sub> in the initial period but exposed to D<sub>2</sub> in the outcome period; and d is the number of patients not exposed to either D<sub>1</sub> in the initial period or D<sub>2</sub> in the outcome period (<xref ref-type="table" rid="table1">Table 1</xref>).</p>
        <p>Since a single misdiagnosis can cause a very large error in the RR value if the numbers in the contingency table are small, we established a minimum size of 947 patients for each group. For example, the diagnosis with the highest prevalence in the initial period was “J20: acute bronchitis,” with 355,045 patients diagnosed at least once in the observation period.</p>
        <p>The diagnosis with the lowest prevalence was “R80: isolated proteinuria,” with 947 patients diagnosed during the observation period. Consequently, the at-risk group sizes ranged from 530,080 (885,125 − 355,045) for acute bronchitis to 884,178 (885,125 − 947) for isolated proteinuria.</p>
        <p>To select the cutoff value for the RR, we chose the closest integer to the top percentile (ie, the closest integer to x where <italic>P</italic> [RR &#62; x] = .01), which was 4. Therefore, we selected disease relationships with an RR of more than 4 and an FDR-corrected <italic>P</italic> value of &#60;.001 to construct our final network.</p>
        <p>Accordingly, the prevalence and at-risk group sizes were large enough to accurately determine the RR. Because self-interactions were outside the scope of this study, the total number of theoretical interactions among the 520 nodes was 269,880 (520 × 519).</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Contingency table for disease-disease risk ratio calculation.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="500"/>
            <col width="250"/>
            <col width="250"/>
            <thead>
              <tr valign="top">
                <td>Risk disease in 2002-2003</td>
                <td colspan="2">Outcome disease in 2004-2013</td>
              </tr>
              <tr valign="top">
                <td/>
                <td>Exposed</td>
                <td>Not exposed</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Exposed</td>
                <td>Value<sup>a</sup></td>
                <td>Value<sup>b</sup></td>
              </tr>
              <tr valign="top">
                <td>Not exposed</td>
                <td>Value<sup>c</sup></td>
                <td>Value<sup>d</sup></td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>Number of patients exposed to the risk disease (D<sub>1</sub>) and outcome disease (D<sub>2</sub>).</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>Number of patients exposed to D<sub>1</sub> but not exposed to D<sub>2</sub>.</p>
            </fn>
            <fn id="table1fn3">
              <p><sup>c</sup>Number of patients not exposed to D<sub>1</sub> but exposed to D<sub>2</sub>.</p>
            </fn>
            <fn id="table1fn4">
              <p><sup>d</sup>Number of patients not exposed to either D<sub>1</sub> or D<sub>2</sub>.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Construction and Visualization of the Disease Network</title>
        <p>Initially, for the construction and visualization of our final disease network, we selected an RR of more than 4 and an FDR-adjusted <italic>P</italic> value of &#60;.001. As a result, we were able to obtain a disease network with four clusters, 294 nodes, and 3085 edges (<xref rid="figure1" ref-type="fig">Figure 1</xref>).</p>
        <p>For better clinically intuitive visualization, we designed a visualization scheme such that the color of the disease node would reflect the age of the patient affected with the disease and that the outbreak size would reflect the relative number of patients. The shape of the node was indicated by a rectangle. Node widths represented the number of female patients, whereas the heights represented the number of male patients. For node colors, the intensity of the red channel was proportional to the ratio of patients younger than 30 years, the intensity of the green channel was proportional to the ratio of patients aged between 30 and 59 years, and the intensity of the blue channel was proportional to the ratio of patients aged 60 years or older.</p>
        <p>Meanwhile, to indicate the directionality and weight of the node, the edges were represented by arrows and the relative thickness was represented in gray. The number of patients in each sex and age group for each disease was calculated at the beginning of the outcome period based on the included patients’ histories during the observation period.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Visualization of the disease network. The network is constructed using the prefuse force-directed layout.</p>
          </caption>
          <graphic xlink:href="jmir_v22i4e15196_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Support Offered by the Clinical Evidence From Relationships Among Diseases</title>
        <p>To determine whether the correlations among inferred diseases in our disease network model were clinically meaningful, we investigated the available literature concerning the top six disease-disease associations with the highest RR values from the established disease network.</p>
        <p>Most results appeared in agreement with previously known associations among diseases (<xref ref-type="table" rid="table2">Table 2</xref>). A substantial nosologic and biologic overlap exists between bipolar disorder and schizophrenia [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref23">23</xref>]. Further, long-standing hypertension is known to be an important cause and consequence of chronic kidney disease [<xref ref-type="bibr" rid="ref24">24</xref>]. It is also well-known that anemia develops in chronic kidney disease and portends an unfavorable prognosis [<xref ref-type="bibr" rid="ref25">25</xref>].</p>
        <p>Interestingly, the association between diabetes mellitus in pregnancy and neonatal jaundice was also very high, despite the fact that neonates are never pregnant. This outcome is possible because diagnoses for infants who are not yet in the national registry are filled out under the mother’s account for insurance [<xref ref-type="bibr" rid="ref26">26</xref>-<xref ref-type="bibr" rid="ref28">28</xref>]. Another interesting aspect of our results was the fact that neonatal jaundice and diaper dermatitis were strongly associated with one another, which was not observed in previous epidemiological studies.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Top relative risk values.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="400"/>
            <col width="330"/>
            <col width="120"/>
            <col width="150"/>
            <thead>
              <tr valign="top">
                <td>Risk factor disease</td>
                <td>Outcome disease</td>
                <td>RR<sup>a</sup></td>
                <td>References</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Bipolar affective disorder</td>
                <td>Schizophrenia</td>
                <td>34.4</td>
                <td>[<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref23">23</xref>]</td>
              </tr>
              <tr valign="top">
                <td>Chronic kidney disease</td>
                <td>Hypertensive renal disease</td>
                <td>31.9</td>
                <td>[<xref ref-type="bibr" rid="ref24">24</xref>]</td>
              </tr>
              <tr valign="top">
                <td>Diabetes mellitus in pregnancy</td>
                <td>Neonatal jaundice</td>
                <td>29.1</td>
                <td>[<xref ref-type="bibr" rid="ref26">26</xref>-<xref ref-type="bibr" rid="ref28">28</xref>]</td>
              </tr>
              <tr valign="top">
                <td>Neonatal jaundice</td>
                <td>Diaper dermatitis</td>
                <td>28.1</td>
                <td>N/A<sup>b</sup></td>
              </tr>
              <tr valign="top">
                <td>Chronic kidney disease</td>
                <td>Anemia in chronic disease</td>
                <td>27.4</td>
                <td>[<xref ref-type="bibr" rid="ref25">25</xref>]</td>
              </tr>
              <tr valign="top">
                <td>Hemorrhage in early pregnancy</td>
                <td>Neonatal jaundice</td>
                <td>26.1</td>
                <td>[<xref ref-type="bibr" rid="ref27">27</xref>]</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>RR: relative risk.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>N/A: not applicable.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Topological Characteristics of the Disease Network</title>
        <p>We investigated the in- and out-degree distributions of our constructed network. Like many other networks, the in- and out-degrees of our network followed a power-law distribution with a long tail [<xref ref-type="bibr" rid="ref29">29</xref>] (<xref rid="figure2" ref-type="fig">Figure 2</xref>). However, in contrast with the degrees, neither in- nor out-strength followed the power-law distribution (<xref rid="figure3" ref-type="fig">Figure 3</xref>).</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Distribution of the network for in- and out-degrees.</p>
          </caption>
          <graphic xlink:href="jmir_v22i4e15196_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Distribution of the network for in- and out-strength.</p>
          </caption>
          <graphic xlink:href="jmir_v22i4e15196_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p><xref ref-type="table" rid="table3">Table 3</xref> shows the top six diseases with the highest out-degree, in-degree, out-strength, and in-strength results. The top out-degree diseases included diseases that are known to affect many other conditions such as chronic kidney disease and essential hypertension.</p>
        <p>The top in-degree diseases are known to be associated with long-term hospitalization or immunocompromise, which are statuses that can arise from various diseases. The top out-degree and top out-strength diseases had considerable overlap, with polyneuropathy, senile cataract, and retinal disorders all being both high out-degree and high out-strength diseases. Patients with these diseases may be at greater risk for developing multiple comorbidities.</p>
        <p>The top in-degree and top in-strength diseases included Parkinson disease, chronic kidney disease, anemia in chronic disease, and osteoporosis with pathological fracture. This suggests that many different diseases can have a strong tendency to converge onto these diseases. Subsequently, we explored the relationships between out-degree and in-degree and between out-strength and in-strength results.</p>
        <p>The correlation between the out-strength and in-strength findings (Pearson correlation coefficient: 0.72) was stronger than that between the out-degree and in-degree findings (Pearson correlation coefficient: 0.57) (<xref rid="figure4" ref-type="fig">Figure 4</xref>). This means that diseases show strong tendencies to develop from other diseases. For better characterization, we color-coded the diseases in the out-/in-strength plot according to the age composition of the patients (<xref rid="figure5" ref-type="fig">Figure 5</xref>). This revealed that mean age was related to positioning along the regression line of the out-/in-strength plot.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Top out-/in-degree diseases and top out-/in-strength diagnoses.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="470"/>
            <col width="500"/>
            <thead>
              <tr valign="top">
                <td colspan="2">KCD<sup>a</sup> code and disease</td>
                <td>Degree</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="2">
                  <bold>Top out-degree diseases</bold>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>G63: polyneuropathy</td>
                <td>43</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>C61: malignant neoplasm of the prostate</td>
                <td>43</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>H25: senile cataract</td>
                <td>43</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>H36: retinal disorders</td>
                <td>42</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>N18: chronic kidney disease</td>
                <td>42</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>I10: essential hypertension</td>
                <td>39</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Top in-degree diseases</bold>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>G20: Parkinson disease</td>
                <td>82</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>M80: osteoporosis with pathological fracture</td>
                <td>64</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>N18: chronic kidney disease</td>
                <td>62</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>D63: anemia in chronic diseases</td>
                <td>61</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>A41: sepsis</td>
                <td>59</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Top out-strength diseases</bold>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>G63: polyneuropathy</td>
                <td>1057</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>H36: retinal disorders</td>
                <td>998</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>M48: spondylopathies</td>
                <td>992</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>H25: senile cataract</td>
                <td>992</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>M81: osteoporosis without pathological fracture</td>
                <td>981</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>M17: arthrosis of the knee</td>
                <td>979</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Top in-strength diseases</bold>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>G20: Parkinson disease</td>
                <td>1197</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>N18: chronic kidney disease</td>
                <td>1135</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>D63: anemia in chronic diseases</td>
                <td>1123</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>M80: osteoporosis with pathological fracture</td>
                <td>1120</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>I12: hypertensive renal disease</td>
                <td>1100</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>H27: disorder of the lens</td>
                <td>1089</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>KCD: Korean Classification of Diseases.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Correlations between in- and out-degrees and in- and out-strengths.</p>
          </caption>
          <graphic xlink:href="jmir_v22i4e15196_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>Out- and in-strengths plotted according to the age composition of the patients.</p>
          </caption>
          <graphic xlink:href="jmir_v22i4e15196_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Characterization of Large Clusters Throughout Computational Clustering</title>
        <p>To confirm whether the visually observed clustering in <xref rid="figure1" ref-type="fig">Figure 1</xref> was an artifact of the layout algorithm, we employed a random walktrap algorithm for network clustering [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref21">21</xref>].</p>
        <p>A total of 19 clusters were detected, including four large clusters of a size greater than 38 and 15 small clusters of a size less than 13. When we color-coded the network using these four major clusters, we could see that the top right and top left clusters were almost exactly as visualized, but the largest cluster was detected as two large subclusters (<xref rid="figure6" ref-type="fig">Figure 6</xref>).</p>
        <p>This confirmed that disease associations grouped diseases into a few distinct clusters and that this occurred independently of the prefuse force-directed layout. Interestingly, the modularity score for the random walktrap algorithm (0.53) was more than twice the score for the KCD categories (0.24). To see whether the four major clusters actually had the characteristics that we noticed in the visualization, we profiled the clusters with respect to the age distribution and sex ratio of the affected patients (<xref rid="figure7" ref-type="fig">Figure 7</xref>).</p>
        <p>Patients diagnosed with diseases in clusters 1 and 3 were relatively older (mean age of 47.4 [SD 18.22] years and 48.19 [SD 18.66] years, respectively). The diseases in cluster 2 were dominated by women of reproductive age (the ratio of males to females was 1:18.67; mean age: 39.38 [SD 13.08] years). Cluster 4 included patients who were relatively young, with slightly more females (the ratio of males to females was 1:1.22; mean age: 31.7 [SD 21.56] years).</p>
        <p>We profiled the KCD classes of each cluster and performed an enrichment analysis to investigate the types of diseases that were enriched in each cluster (<italic>P</italic>=.05). Although every cluster contained its own disease groups (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>), the enrichment analysis revealed that each of the four major clusters was enriched with nonoverlapping sets of KCD categories (<xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>). Since each cluster had distinct characteristics, we labeled the major clusters from 1 to 4, according to their most prominent features, as “chronic debilitation,” “women’s disease,” “hemato-oncology,” and “infectious disease” clusters, respectively.</p>
        <fig id="figure6" position="float">
          <label>Figure 6</label>
          <caption>
            <p>Four major clusters of the network.</p>
          </caption>
          <graphic xlink:href="jmir_v22i4e15196_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure7" position="float">
          <label>Figure 7</label>
          <caption>
            <p>Age distribution and sex ratio for the four major clusters.</p>
          </caption>
          <graphic xlink:href="jmir_v22i4e15196_fig7.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>In this study, we proposed a comprehensive method for modeling a disease network with directionality and weight of edges using medical claims data. We selected only the most common diagnoses to avoid an overestimation of RR among rare diseases. The ϕ correlation is also useful to avoid overestimation of associations among rare diseases [<xref ref-type="bibr" rid="ref12">12</xref>], but it is clinically less intuitive and unnecessary for the purpose of studying the overall pattern of common disease associations. Epidemiological factors, such as age and sex, are important inducers of disease development [<xref ref-type="bibr" rid="ref30">30</xref>-<xref ref-type="bibr" rid="ref33">33</xref>]; they are, in effect, the most critical clinical factors affecting the prevalence and classification of diseases.</p>
        <p>Another purpose of this study was to incorporate these various factors into the disease network and to see how they affect the structure and dynamics of the disease network. In addition, these factors were reflected in the visualization of the disease network. In our disease network model, we proposed an intuitive visualization method that maximizes clinical usability.</p>
        <p>Nodes indicate the patient outbreak size and, at the same time, represent the relative proportions of women (width) and men (height) as a rectangle. In addition, each node is divided into red for young patients, green for middle-aged patients, and blue for old patients. Meanwhile, the RR and direction among diseases can be intuitively grasped through the arrow and the thickness of the edge.</p>
        <p>As a result, our visualization method of a disease network can help to intuitively identify the direction and RR among diseases and can help to effectively understand the age distribution, sex ratio, and disease outbreak size. The directionality of the disease relationship is a consequence of the study design being longitudinal with a chronological order. Strong RR values support disease association in a chronological order, which is a prerequisite for causality among diseases in clinical research [<xref ref-type="bibr" rid="ref34">34</xref>]. Because of this, our network can be a starting point to investigate causality among diseases. Here, we examined the literature on disease relationships with high RRs.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>The NHIS-NSC includes the proportional stratified sampling data of 1,025,340 patients from among 47,851,928 patients. These patients were randomly extracted by age group, sex, eligibility status, and income level using a proportional stratified sampling method [<xref ref-type="bibr" rid="ref35">35</xref>]. In general, NHIS-NSC data are representative, but some rare diseases may lose their representativeness owing to the difficulty in obtaining statistical significance. Owing to these limitations, this study excluded disease groups with a small sample size, and rare diseases that have not been assessed in this study are expected to be evaluated in future studies.</p>
        <p>As a result, we have shown that our network can provide clues to reveal the causal relationships among diseases. In our network, neonatal jaundice and diaper dermatitis presented a statistically meaningful association (RR=28.1, <italic>P</italic>&#60;.001), but we did not find other supporting evidence of such an association during the literature search. Nonetheless, this does not mean that our network had an incorrect result. Rather, it suggests the possibility of associations that researchers have not yet discovered. In a strict sense, it can be difficult to say that this is a causal relationship because directionality can only be thought of as the natural progression of a disease, the outcome of a treatment, or the process of making a diagnosis.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>During our research, we investigated network topologies, such as degree and strength. Both in- and out-degrees followed a power-law distribution like other biological networks; however, strength distributions did not. Since the RR values do not indicate causality, we cannot say that a certain disease is the cause of many other diseases by only looking at out-degrees and out-strengths. Despite this, patients with high out-degree and high out-strength diseases (eg, polyneuropathy, retinal disorders, and senile cataract) are worthy of special attention for secondary prevention purposes. Similarly, diseases with high in-degree and high in-strength findings, such as Parkinson disease, osteoporosis with pathological fracture, and chronic kidney disease, can be seen as common comorbidities of many different diseases.</p>
        <p>We found stronger correlations between in- and out-strengths than between in- and out-degrees. Moreover, a stronger risk associated with a disease tended to be related to older affected patients. The association between age and strength suggested that the previously discovered correlation between disease connectivity and mortality could be explained by the phenomenon of increased risk strength.</p>
        <p>Through clustering of the network, we found four major disease clusters with distinct demographic characteristics. Interestingly, each cluster was exclusively enriched in KCD categories and had a different mean age and sex ratio. The clustering patterns analyzed using our network suggest that KCD categories, age, and sex have strong influences on disease associations and highlight the importance of demographic factors. Since patients with diseases within a cluster tend to acquire other diseases within the same cluster, we may be able to minimize the onset of comorbidities through patient care by configuring specialty clinics to cater to clusters or subclusters of associated diseases, as is the case with obstetrics and gynecology.</p>
        <p>In this regard, our proposed disease network model will likely serve as a valuable tool for early clinical researchers seeking to further explore the relationships of diseases in the future.</p>
        <p>In future studies, we will take into account the dynamics of the network with respect to time order and assess the network collapse point that can affect the overall network structure.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Korean Classification of Diseases composition of disease nodes in each cluster. The composition of each disease cluster in terms of disease categories is shown in this bar chart.</p>
        <media xlink:href="jmir_v22i4e15196_app1.docx" xlink:title="DOCX File, 238 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Enrichment analyses revealed that each of the four major communities was enriched with nonoverlapping sets of Korean Classification of Diseases categories.</p>
        <media xlink:href="jmir_v22i4e15196_app2.docx" xlink:title="DOCX File, 14 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">FDR</term>
          <def>
            <p>false-discovery rate</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">ICD-10</term>
          <def>
            <p>International Statistical Classification of Diseases, 10th revision</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">KCD-6</term>
          <def>
            <p>Korean Classification of Diseases, sixth revision</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">NHIS-NSC</term>
          <def>
            <p>National Health Insurance Service-National Sample Cohort</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">RR</term>
          <def>
            <p>relative risk</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This work was supported by the Basic Science Research Program through the National Research Foundation of Korea funded by the Ministry of Science, ICT &#38; Future Planning (NRF-2017R1E1A1A03070934) and the Ministry of Science &#38; ICT (NRF-2019M3C7A1032262).</p>
    </ack>
    <fn-group>
      <fn fn-type="con">
        <p>HWH conceived the project; HWH, SVA, JHB, and NSM designed the research; KMK and JMP performed the research; KMK and JMY analyzed the data; and CWL, CYB, and HWH wrote the paper.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mooe</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Björklund</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Graipe</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Huber</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Jakobsson</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kajermo</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Strömvall</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ulvenstam</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>The Nurse-Based Age Independent Intervention to Limit Evolution of Disease After Acute Coronary Syndrome (NAILED ACS) Risk Factor Trial: Protocol for a Randomized Controlled Trial</article-title>
          <source>JMIR Res Protoc</source>
          <year>2014</year>
          <month>08</month>
          <day>15</day>
          <volume>3</volume>
          <issue>3</issue>
          <fpage>e42</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.researchprotocols.org/2014/3/e42/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/resprot.3466</pub-id>
          <pub-id pub-id-type="medline">25131960</pub-id>
          <pub-id pub-id-type="pii">v3i3e42</pub-id>
          <pub-id pub-id-type="pmcid">PMC4147706</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Wen</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Fan</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Detecting Lifestyle Risk Factors for Chronic Kidney Disease With Comorbidities: Association Rule Mining Analysis of Web-Based Survey Data</article-title>
          <source>J Med Internet Res</source>
          <year>2019</year>
          <month>12</month>
          <day>10</day>
          <volume>21</volume>
          <issue>12</issue>
          <fpage>e14204</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2019/12/e14204/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/14204</pub-id>
          <pub-id pub-id-type="medline">31821152</pub-id>
          <pub-id pub-id-type="pii">v21i12e14204</pub-id>
          <pub-id pub-id-type="pmcid">PMC6930505</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tluway</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Urio</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Mmbando</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Sangeda</surname>
              <given-names>RZ</given-names>
            </name>
            <name name-style="western">
              <surname>Makubi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Makani</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Possible Risk Factors for Severe Anemia in Hospitalized Sickle Cell Patients at Muhimbili National Hospital, Tanzania: Protocol for a Cross-Sectional Study</article-title>
          <source>JMIR Res Protoc</source>
          <year>2018</year>
          <month>02</month>
          <day>28</day>
          <volume>7</volume>
          <issue>2</issue>
          <fpage>e46</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.researchprotocols.org/2018/2/e46/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/resprot.7349</pub-id>
          <pub-id pub-id-type="medline">29490896</pub-id>
          <pub-id pub-id-type="pii">v7i2e46</pub-id>
          <pub-id pub-id-type="pmcid">PMC5856920</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Linet</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Vajdic</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Morton</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>de Roos</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Skibola</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Boffetta</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Cerhan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Flowers</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>de Sanjosé</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Monnereau</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cocco</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Kelly</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Weisenburger</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Clarke</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Blair</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bernstein</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Miligi</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Clavel</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Benavente</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chiu</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Medical history, lifestyle, family history, and occupational risk factors for follicular lymphoma: the InterLymph Non-Hodgkin Lymphoma Subtypes Project</article-title>
          <source>J Natl Cancer Inst Monogr</source>
          <year>2014</year>
          <month>08</month>
          <volume>2014</volume>
          <issue>48</issue>
          <fpage>26</fpage>
          <lpage>40</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25174024"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jncimonographs/lgu006</pub-id>
          <pub-id pub-id-type="medline">25174024</pub-id>
          <pub-id pub-id-type="pii">lgu006</pub-id>
          <pub-id pub-id-type="pmcid">PMC4155461</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Silverman</surname>
              <given-names>DT</given-names>
            </name>
            <name name-style="western">
              <surname>Schiffman</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Everhart</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Goldstein</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lillemoe</surname>
              <given-names>KD</given-names>
            </name>
            <name name-style="western">
              <surname>Swanson</surname>
              <given-names>GM</given-names>
            </name>
            <name name-style="western">
              <surname>Schwartz</surname>
              <given-names>AG</given-names>
            </name>
            <name name-style="western">
              <surname>Brown</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Greenberg</surname>
              <given-names>RS</given-names>
            </name>
            <name name-style="western">
              <surname>Schoenberg</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Pottern</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Hoover</surname>
              <given-names>RN</given-names>
            </name>
            <name name-style="western">
              <surname>Fraumeni</surname>
              <given-names>JF</given-names>
            </name>
          </person-group>
          <article-title>Diabetes mellitus, other medical conditions and familial history of cancer as risk factors for pancreatic cancer</article-title>
          <source>Br J Cancer</source>
          <year>1999</year>
          <month>08</month>
          <volume>80</volume>
          <issue>11</issue>
          <fpage>1830</fpage>
          <lpage>7</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/10468306"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/sj.bjc.6690607</pub-id>
          <pub-id pub-id-type="medline">10468306</pub-id>
          <pub-id pub-id-type="pmcid">PMC2363127</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tillmann</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Gibson</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>Scott</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Harrison</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Dominiczak</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hanlon</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Systems Medicine 2.0: potential benefits of combining electronic health care records with systems science models</article-title>
          <source>J Med Internet Res</source>
          <year>2015</year>
          <month>03</month>
          <day>23</day>
          <volume>17</volume>
          <issue>3</issue>
          <fpage>e64</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2015/3/e64/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.3082</pub-id>
          <pub-id pub-id-type="medline">25831125</pub-id>
          <pub-id pub-id-type="pii">v17i3e64</pub-id>
          <pub-id pub-id-type="pmcid">PMC4387294</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Barabási</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Gulbahce</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Loscalzo</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Network medicine: a network-based approach to human disease</article-title>
          <source>Nat Rev Genet</source>
          <year>2011</year>
          <month>01</month>
          <volume>12</volume>
          <issue>1</issue>
          <fpage>56</fpage>
          <lpage>68</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21164525"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/nrg2918</pub-id>
          <pub-id pub-id-type="medline">21164525</pub-id>
          <pub-id pub-id-type="pii">nrg2918</pub-id>
          <pub-id pub-id-type="pmcid">PMC3140052</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Loscalzo</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Barabási</surname>
              <given-names>AL</given-names>
            </name>
          </person-group>
          <article-title>Systems biology and the future of medicine</article-title>
          <source>Wiley Interdiscip Rev Syst Biol Med</source>
          <year>2011</year>
          <volume>3</volume>
          <issue>6</issue>
          <fpage>619</fpage>
          <lpage>27</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21928407"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/wsbm.144</pub-id>
          <pub-id pub-id-type="medline">21928407</pub-id>
          <pub-id pub-id-type="pmcid">PMC3188693</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Al-Harazi</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Al Insaif</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Al-Ajlan</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Kaya</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Dzimiri</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Colak</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Integrated Genomic and Network-Based Analyses of Complex Diseases and Human Disease Network</article-title>
          <source>J Genet Genomics</source>
          <year>2016</year>
          <month>06</month>
          <day>20</day>
          <volume>43</volume>
          <issue>6</issue>
          <fpage>349</fpage>
          <lpage>67</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jgg.2015.11.002</pub-id>
          <pub-id pub-id-type="medline">27318646</pub-id>
          <pub-id pub-id-type="pii">S1673-8527(15)00211-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Davis</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Chawla</surname>
              <given-names>NV</given-names>
            </name>
          </person-group>
          <article-title>Exploring and exploiting disease interactions from multi-relational gene and phenotype networks</article-title>
          <source>PLoS One</source>
          <year>2011</year>
          <volume>6</volume>
          <issue>7</issue>
          <fpage>e22670</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0022670"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0022670</pub-id>
          <pub-id pub-id-type="medline">21829475</pub-id>
          <pub-id pub-id-type="pii">PONE-D-11-01204</pub-id>
          <pub-id pub-id-type="pmcid">PMC3146471</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Goh</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Cusick</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Valle</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Childs</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Vidal</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Barabási</surname>
              <given-names>AL</given-names>
            </name>
          </person-group>
          <article-title>The human disease network</article-title>
          <source>Proc Natl Acad Sci U S A</source>
          <year>2007</year>
          <month>05</month>
          <day>22</day>
          <volume>104</volume>
          <issue>21</issue>
          <fpage>8685</fpage>
          <lpage>90</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.pnas.org/cgi/pmidlookup?view=long&#38;pmid=17502601"/>
          </comment>
          <pub-id pub-id-type="doi">10.1073/pnas.0701361104</pub-id>
          <pub-id pub-id-type="medline">17502601</pub-id>
          <pub-id pub-id-type="pii">0701361104</pub-id>
          <pub-id pub-id-type="pmcid">PMC1885563</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hidalgo</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Blumm</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Barabási</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Christakis</surname>
              <given-names>NA</given-names>
            </name>
          </person-group>
          <article-title>A dynamic network approach for the study of human phenotypes</article-title>
          <source>PLoS Comput Biol</source>
          <year>2009</year>
          <month>04</month>
          <volume>5</volume>
          <issue>4</issue>
          <fpage>e1000353</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pcbi.1000353"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pcbi.1000353</pub-id>
          <pub-id pub-id-type="medline">19360091</pub-id>
          <pub-id pub-id-type="pmcid">PMC2661364</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jensen</surname>
              <given-names>AB</given-names>
            </name>
            <name name-style="western">
              <surname>Moseley</surname>
              <given-names>PL</given-names>
            </name>
            <name name-style="western">
              <surname>Oprea</surname>
              <given-names>TI</given-names>
            </name>
            <name name-style="western">
              <surname>Ellesøe</surname>
              <given-names>SG</given-names>
            </name>
            <name name-style="western">
              <surname>Eriksson</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Schmock</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Jensen</surname>
              <given-names>PB</given-names>
            </name>
            <name name-style="western">
              <surname>Jensen</surname>
              <given-names>LJ</given-names>
            </name>
            <name name-style="western">
              <surname>Brunak</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Temporal disease trajectories condensed from population-wide registry data covering 6.2 million patients</article-title>
          <source>Nat Commun</source>
          <year>2014</year>
          <month>06</month>
          <day>24</day>
          <volume>5</volume>
          <fpage>4022</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24959948"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/ncomms5022</pub-id>
          <pub-id pub-id-type="medline">24959948</pub-id>
          <pub-id pub-id-type="pii">ncomms5022</pub-id>
          <pub-id pub-id-type="pmcid">PMC4090719</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Agarwal</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>A pathway-based view of human diseases and disease relationships</article-title>
          <source>PLoS One</source>
          <year>2009</year>
          <volume>4</volume>
          <issue>2</issue>
          <fpage>e4346</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0004346"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0004346</pub-id>
          <pub-id pub-id-type="medline">19194489</pub-id>
          <pub-id pub-id-type="pmcid">PMC2631151</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Park</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Christakis</surname>
              <given-names>NA</given-names>
            </name>
            <name name-style="western">
              <surname>Barabási</surname>
              <given-names>AL</given-names>
            </name>
          </person-group>
          <article-title>The impact of cellular networks on disease comorbidity</article-title>
          <source>Mol Syst Biol</source>
          <year>2009</year>
          <volume>5</volume>
          <fpage>262</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/msb.2009.16"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/msb.2009.16</pub-id>
          <pub-id pub-id-type="medline">19357641</pub-id>
          <pub-id pub-id-type="pii">msb200916</pub-id>
          <pub-id pub-id-type="pmcid">PMC2683720</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Lv</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>The expanded human disease network combining protein-protein interaction information</article-title>
          <source>Eur J Hum Genet</source>
          <year>2011</year>
          <month>07</month>
          <volume>19</volume>
          <issue>7</issue>
          <fpage>783</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.doi.org/10.1038/ejhg.2011.30"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/ejhg.2011.30</pub-id>
          <pub-id pub-id-type="medline">21386875</pub-id>
          <pub-id pub-id-type="pii">ejhg201130</pub-id>
          <pub-id pub-id-type="pmcid">PMC3137500</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Menche</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Barabási</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Sharma</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Human symptoms-disease network</article-title>
          <source>Nat Commun</source>
          <year>2014</year>
          <month>06</month>
          <day>26</day>
          <volume>5</volume>
          <fpage>4212</fpage>
          <pub-id pub-id-type="doi">10.1038/ncomms5212</pub-id>
          <pub-id pub-id-type="medline">24967666</pub-id>
          <pub-id pub-id-type="pii">ncomms5212</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>NJ</given-names>
            </name>
            <name name-style="western">
              <surname>Vogelstein</surname>
              <given-names>JT</given-names>
            </name>
            <name name-style="western">
              <surname>Parmigiani</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Kinzler</surname>
              <given-names>KW</given-names>
            </name>
            <name name-style="western">
              <surname>Vogelstein</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Velculescu</surname>
              <given-names>VE</given-names>
            </name>
          </person-group>
          <article-title>The predictive capacity of personal genome sequencing</article-title>
          <source>Sci Transl Med</source>
          <year>2012</year>
          <month>05</month>
          <day>09</day>
          <volume>4</volume>
          <issue>133</issue>
          <fpage>133ra58</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://stm.sciencemag.org/cgi/pmidlookup?view=long&#38;pmid=22472521"/>
          </comment>
          <pub-id pub-id-type="doi">10.1126/scitranslmed.3003380</pub-id>
          <pub-id pub-id-type="medline">22472521</pub-id>
          <pub-id pub-id-type="pii">scitranslmed.3003380</pub-id>
          <pub-id pub-id-type="pmcid">PMC3741669</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gross</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>What systems biology can tell us about disease</article-title>
          <source>Hist Philos Life Sci</source>
          <year>2011</year>
          <volume>33</volume>
          <issue>4</issue>
          <fpage>477</fpage>
          <lpage>96</lpage>
          <pub-id pub-id-type="medline">22662506</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pons</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Latapy</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Computing communities in large networks using random walks</article-title>
          <source>Computer and Information Sciences</source>
          <year>2005</year>
          <conf-name>20th International Conference on Computer and Information Sciences</conf-name>
          <conf-date>October 26-28</conf-date>
          <conf-loc>Istanbul, Turkey</conf-loc>
          <publisher-loc>Berlin, Heidelberg</publisher-loc>
          <publisher-name>Springer</publisher-name>
          <fpage>284</fpage>
          <lpage>293</lpage>
          <pub-id pub-id-type="doi">10.1007/11569596_31</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rosvall</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bergstrom</surname>
              <given-names>CT</given-names>
            </name>
          </person-group>
          <article-title>Maps of random walks on complex networks reveal community structure</article-title>
          <source>Proc Natl Acad Sci U S A</source>
          <year>2008</year>
          <month>01</month>
          <day>29</day>
          <volume>105</volume>
          <issue>4</issue>
          <fpage>1118</fpage>
          <lpage>23</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.pnas.org/cgi/pmidlookup?view=long&#38;pmid=18216267"/>
          </comment>
          <pub-id pub-id-type="doi">10.1073/pnas.0706851105</pub-id>
          <pub-id pub-id-type="medline">18216267</pub-id>
          <pub-id pub-id-type="pii">0706851105</pub-id>
          <pub-id pub-id-type="pmcid">PMC2234100</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Laursen</surname>
              <given-names>TM</given-names>
            </name>
            <name name-style="western">
              <surname>Agerbo</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Pedersen</surname>
              <given-names>CB</given-names>
            </name>
          </person-group>
          <article-title>Bipolar disorder, schizoaffective disorder, and schizophrenia overlap: a new comorbidity index</article-title>
          <source>J Clin Psychiatry</source>
          <year>2009</year>
          <month>10</month>
          <volume>70</volume>
          <issue>10</issue>
          <fpage>1432</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.4088/JCP.08m04807</pub-id>
          <pub-id pub-id-type="medline">19538905</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pearlson</surname>
              <given-names>GD</given-names>
            </name>
          </person-group>
          <article-title>Etiologic, phenomenologic, and endophenotypic overlap of schizophrenia and bipolar disorder</article-title>
          <source>Annu Rev Clin Psychol</source>
          <year>2015</year>
          <volume>11</volume>
          <fpage>251</fpage>
          <lpage>81</lpage>
          <pub-id pub-id-type="doi">10.1146/annurev-clinpsy-032814-112915</pub-id>
          <pub-id pub-id-type="medline">25581236</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gargiulo</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Suhail</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Lerma</surname>
              <given-names>EV</given-names>
            </name>
          </person-group>
          <article-title>Hypertension and chronic kidney disease</article-title>
          <source>Dis Mon</source>
          <year>2015</year>
          <month>09</month>
          <volume>61</volume>
          <issue>9</issue>
          <fpage>387</fpage>
          <lpage>95</lpage>
          <pub-id pub-id-type="doi">10.1016/j.disamonth.2015.07.003</pub-id>
          <pub-id pub-id-type="medline">26328515</pub-id>
          <pub-id pub-id-type="pii">S0011-5029(15)00101-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Iseki</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kohagura</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Anemia as a risk factor for chronic kidney disease</article-title>
          <source>Kidney Int Suppl</source>
          <year>2007</year>
          <month>11</month>
          <issue>107</issue>
          <fpage>S4</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0085-2538(15)52556-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/sj.ki.5002481</pub-id>
          <pub-id pub-id-type="medline">17943141</pub-id>
          <pub-id pub-id-type="pii">S0085-2538(15)52556-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Alam</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Raza</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Sherali</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>Akhtar</surname>
              <given-names>SM</given-names>
            </name>
          </person-group>
          <article-title>Neonatal complications in infants born to diabetic mothers</article-title>
          <source>J Coll Physicians Surg Pak</source>
          <year>2006</year>
          <month>03</month>
          <volume>16</volume>
          <issue>3</issue>
          <fpage>212</fpage>
          <lpage>5</lpage>
          <pub-id pub-id-type="medline">16542603</pub-id>
          <pub-id pub-id-type="pii">040579197</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Kanguru</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Hussein</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Fitzmaurice</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ritchie</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Incidence of adverse outcomes associated with gestational diabetes mellitus in low- and middle-income countries</article-title>
          <source>Int J Gynaecol Obstet</source>
          <year>2013</year>
          <month>04</month>
          <volume>121</volume>
          <issue>1</issue>
          <fpage>14</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ijgo.2012.10.032</pub-id>
          <pub-id pub-id-type="medline">23321368</pub-id>
          <pub-id pub-id-type="pii">S0020-7292(12)00674-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Cummings</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>O'Connell</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Jangaard</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Fetal and neonatal outcomes of diabetic pregnancies</article-title>
          <source>Obstet Gynecol</source>
          <year>2006</year>
          <month>09</month>
          <volume>108</volume>
          <issue>3 Pt 1</issue>
          <fpage>644</fpage>
          <lpage>50</lpage>
          <pub-id pub-id-type="doi">10.1097/01.AOG.0000231688.08263.47</pub-id>
          <pub-id pub-id-type="medline">16946226</pub-id>
          <pub-id pub-id-type="pii">108/3/644</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Albert</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Scale-free networks in cell biology</article-title>
          <source>J Cell Sci</source>
          <year>2005</year>
          <month>11</month>
          <day>01</day>
          <volume>118</volume>
          <issue>Pt 21</issue>
          <fpage>4947</fpage>
          <lpage>57</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://jcs.biologists.org/cgi/pmidlookup?view=long&#38;pmid=16254242"/>
          </comment>
          <pub-id pub-id-type="doi">10.1242/jcs.02714</pub-id>
          <pub-id pub-id-type="medline">16254242</pub-id>
          <pub-id pub-id-type="pii">118/21/4947</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kasen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Velez</surname>
              <given-names>CN</given-names>
            </name>
            <name name-style="western">
              <surname>Hartmark</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Rojas</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Brook</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Streuning</surname>
              <given-names>EL</given-names>
            </name>
          </person-group>
          <article-title>An epidemiological study of disorders in late childhood and adolescence—I. Age- and gender-specific prevalence</article-title>
          <source>J Child Psychol Psychiatry</source>
          <year>1993</year>
          <month>09</month>
          <volume>34</volume>
          <issue>6</issue>
          <fpage>851</fpage>
          <lpage>67</lpage>
          <pub-id pub-id-type="doi">10.1111/j.1469-7610.1993.tb01094.x</pub-id>
          <pub-id pub-id-type="medline">8408371</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Farrer</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Cupples</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Haines</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hyman</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Kukull</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Mayeux</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Myers</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Pericak-Vance</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Risch</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>van Duijn</surname>
              <given-names>CM</given-names>
            </name>
          </person-group>
          <article-title>Effects of age, sex, and ethnicity on the association between apolipoprotein E genotype and Alzheimer disease. A meta-analysis. APOE and Alzheimer Disease Meta Analysis Consortium</article-title>
          <source>JAMA</source>
          <year>1997</year>
          <volume>278</volume>
          <issue>16</issue>
          <fpage>1349</fpage>
          <lpage>56</lpage>
          <pub-id pub-id-type="medline">9343467</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Meisinger</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Thorand</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Schneider</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Stieber</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Döring</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Löwel</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Sex differences in risk factors for incident type 2 diabetes mellitus: the MONICA Augsburg cohort study</article-title>
          <source>Arch Intern Med</source>
          <year>2002</year>
          <month>01</month>
          <day>14</day>
          <volume>162</volume>
          <issue>1</issue>
          <fpage>82</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1001/archinte.162.1.82</pub-id>
          <pub-id pub-id-type="medline">11784224</pub-id>
          <pub-id pub-id-type="pii">ioi01008</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Piccinelli</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wilkinson</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Gender differences in depression. Critical review</article-title>
          <source>Br J Psychiatry</source>
          <year>2000</year>
          <month>12</month>
          <volume>177</volume>
          <fpage>486</fpage>
          <lpage>92</lpage>
          <pub-id pub-id-type="doi">10.1192/bjp.177.6.486</pub-id>
          <pub-id pub-id-type="medline">11102321</pub-id>
          <pub-id pub-id-type="pii">S0007125000155989</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Shin</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Causality modeling for directed disease network</article-title>
          <source>Bioinformatics</source>
          <year>2016</year>
          <month>09</month>
          <day>01</day>
          <volume>32</volume>
          <issue>17</issue>
          <fpage>i437</fpage>
          <lpage>i444</lpage>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/btw439</pub-id>
          <pub-id pub-id-type="medline">27587660</pub-id>
          <pub-id pub-id-type="pii">btw439</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Shin</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Cohort Profile: The National Health Insurance Service-National Sample Cohort (NHIS-NSC), South Korea</article-title>
          <source>Int J Epidemiol</source>
          <year>2017</year>
          <month>04</month>
          <day>01</day>
          <volume>46</volume>
          <issue>2</issue>
          <fpage>e15</fpage>
          <pub-id pub-id-type="doi">10.1093/ije/dyv319</pub-id>
          <pub-id pub-id-type="medline">26822938</pub-id>
          <pub-id pub-id-type="pii">dyv319</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
