<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.0" xmlns:xlink="http://www.w3.org/1999/xlink">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v27i1e48775</article-id>
      <article-id pub-id-type="pmid">39932771</article-id>
      <article-id pub-id-type="doi">10.2196/48775</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Subtyping Social Determinants of Health in the "All of Us" Program: Network Analysis and Visualization Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Mavragani</surname>
            <given-names>Amaryllis</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Clark</surname>
            <given-names>Cheryl</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Bhavnani</surname>
            <given-names>Suresh K</given-names>
          </name>
          <degrees>MArch, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>School of Public and Population Health</institution>
            <institution>Department of Biostatistics &amp; Data Science</institution>
            <institution>University of Texas Medical Branch</institution>
            <addr-line>301 University Boulevard</addr-line>
            <addr-line>Galveston, TX, 77555</addr-line>
            <country>United States</country>
            <phone>1 (734) 772 1929</phone>
            <email>subhavna@utmb.edu</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9282-8838</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>Weibin</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6161-0978</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Bao</surname>
            <given-names>Daniel</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-3913-0609</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Raji</surname>
            <given-names>Mukaila</given-names>
          </name>
          <degrees>MSc, MD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7460-7281</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Ajewole</surname>
            <given-names>Veronica</given-names>
          </name>
          <degrees>PharmD, BCOP</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6619-2979</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Hunter</surname>
            <given-names>Rodney</given-names>
          </name>
          <degrees>PharmD</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0009-3357-6827</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Kuo</surname>
            <given-names>Yong-Fang</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1927-0927</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Schmidt</surname>
            <given-names>Susanne</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7684-1648</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author">
          <name name-style="western">
            <surname>Pappadis</surname>
            <given-names>Monique R</given-names>
          </name>
          <degrees>PhD, MEd</degrees>
          <xref rid="aff6" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4742-4380</ext-link>
        </contrib>
        <contrib id="contrib10" contrib-type="author">
          <name name-style="western">
            <surname>Smith</surname>
            <given-names>Elise</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff7" ref-type="aff">7</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-4615-8204</ext-link>
        </contrib>
        <contrib id="contrib11" contrib-type="author">
          <name name-style="western">
            <surname>Bokov</surname>
            <given-names>Alex</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0511-9815</ext-link>
        </contrib>
        <contrib id="contrib12" contrib-type="author">
          <name name-style="western">
            <surname>Reistetter</surname>
            <given-names>Timothy</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff8" ref-type="aff">8</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1732-5533</ext-link>
        </contrib>
        <contrib id="contrib13" contrib-type="author">
          <name name-style="western">
            <surname>Visweswaran</surname>
            <given-names>Shyam</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff9" ref-type="aff">9</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2079-8684</ext-link>
        </contrib>
        <contrib id="contrib14" contrib-type="author">
          <name name-style="western">
            <surname>Downer</surname>
            <given-names>Brian</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff6" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5792-0527</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>School of Public and Population Health</institution>
        <institution>Department of Biostatistics &amp; Data Science</institution>
        <institution>University of Texas Medical Branch</institution>
        <addr-line>Galveston, TX</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Radiology</institution>
        <institution>Houston Methodist</institution>
        <addr-line>Houston, TX</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Department of Internal Medicine</institution>
        <institution>Division of Geriatrics Medicine</institution>
        <institution>University of Texas Medical Branch</institution>
        <addr-line>Galveston, TX</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>College of Pharmacy and Health Sciences</institution>
        <institution>Department of Pharmacy Practice</institution>
        <institution>Texas Southern University</institution>
        <addr-line>Houston, TX</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Department of Population Health Sciences</institution>
        <institution>University of Texas Health San Antonio</institution>
        <addr-line>San Antonio, TX</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff6">
        <label>6</label>
        <institution>School of Public and Population Health</institution>
        <institution>Department of Population Health &amp; Health Disparities</institution>
        <institution>University of Texas Medical Branch</institution>
        <addr-line>Galveston, TX</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff7">
        <label>7</label>
        <institution>School of Public and Population Health</institution>
        <institution>Department of Bioethics &amp; Health Humanities</institution>
        <institution>University of Texas Medical Branch</institution>
        <addr-line>Galveston, TX</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff8">
        <label>8</label>
        <institution>School of Health Professions</institution>
        <institution>Department of Occupational Therapy</institution>
        <institution>University of Texas Health San Antonio</institution>
        <addr-line>San Antonio, TX</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff9">
        <label>9</label>
        <institution>Department of Biomedical Informatics</institution>
        <institution>University of Pittsburgh</institution>
        <addr-line>Pittsburgh, PA</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Suresh K Bhavnani <email>subhavna@utmb.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2025</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>11</day>
        <month>2</month>
        <year>2025</year>
      </pub-date>
      <volume>27</volume>
      <elocation-id>e48775</elocation-id>
      <history>
        <date date-type="received">
          <day>6</day>
          <month>5</month>
          <year>2023</year>
        </date>
        <date date-type="rev-request">
          <day>5</day>
          <month>6</month>
          <year>2023</year>
        </date>
        <date date-type="rev-recd">
          <day>6</day>
          <month>7</month>
          <year>2023</year>
        </date>
        <date date-type="accepted">
          <day>13</day>
          <month>5</month>
          <year>2024</year>
        </date>
      </history>
      <copyright-statement>©Suresh K Bhavnani, Weibin Zhang, Daniel Bao, Mukaila Raji, Veronica Ajewole, Rodney Hunter, Yong-Fang Kuo, Susanne Schmidt, Monique R Pappadis, Elise Smith, Alex Bokov, Timothy Reistetter, Shyam Visweswaran, Brian Downer. Originally published in the Journal of Medical Internet Research (https://www.jmir.org), 11.02.2025.</copyright-statement>
      <copyright-year>2025</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research (ISSN 1438-8871), is properly cited. The complete bibliographic information, a link to the original publication on https://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2025/1/e48775" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Social determinants of health (SDoH), such as financial resources and housing stability, account for between 30% and 55% of people’s health outcomes. While many studies have identified strong associations between specific SDoH and health outcomes, little is known about how SDoH co-occur to form subtypes critical for designing targeted interventions. Such analysis has only now become possible through the <italic>All of Us</italic> program.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aims to analyze the <italic>All of Us</italic> dataset for addressing two research questions: (1) What are the range of and responses to survey questions related to SDoH? and (2) How do SDoH co-occur to form subtypes, and what are their risks for adverse health outcomes?</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>For question 1, an expert panel analyzed the range of and responses to SDoH questions across 6 surveys in the full <italic>All of Us</italic> dataset (N=372,397; version 6). For question 2, due to systematic missingness and uneven granularity of questions across the surveys, we selected all participants with valid and complete SDoH data and used inverse probability weighting to adjust their imbalance in demographics. Next, an expert panel grouped the SDoH questions into SDoH factors to enable more consistent granularity. To identify the subtypes, we used bipartite modularity maximization for identifying SDoH biclusters and measured their significance and replicability. Next, we measured their association with 3 outcomes (depression, delayed medical care, and emergency room visits in the last year). Finally, the expert panel inferred the subtype labels, potential mechanisms, and targeted interventions.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>The question 1 analysis identified 110 SDoH questions across 4 surveys covering all 5 domains in <italic>Healthy People 2030</italic>. As the SDoH questions varied in granularity, they were categorized by an expert panel into 18 SDoH factors. The question 2 analysis (n=12,913; <italic>d</italic>=18) identified 4 biclusters with significant biclusteredness (<italic>Q</italic>=0.13; random-<italic>Q</italic>=0.11; <italic>z</italic>=7.5; <italic>P</italic>&lt;.001) and significant replication (real Rand index=0.88; random Rand index=0.62; <italic>P</italic>&lt;.001). Each subtype had significant associations with specific outcomes and had meaningful interpretations and potential targeted interventions. For example, the <italic>Socioeconomic barriers</italic> subtype included 6 SDoH factors (eg, <italic>not employed</italic> and <italic>food insecurity</italic>) and had a significantly higher odds ratio (4.2, 95% CI 3.5-5.1; <italic>P</italic>&lt;.001) for depression when compared to other subtypes. The expert panel inferred implications of the results for designing interventions and health care policies based on SDoH subtypes.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>This study identified SDoH subtypes that had statistically significant biclusteredness and replicability, each of which had significant associations with specific adverse health outcomes and with translational implications for targeted SDoH interventions and health care policies. However, the high degree of systematic missingness requires repeating the analysis as the data become more complete by using our generalizable and scalable machine learning code available on the <italic>All of Us</italic> workbench.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>social determinants of health</kwd>
        <kwd>All of Us</kwd>
        <kwd>bipartite networks</kwd>
        <kwd>financial resources</kwd>
        <kwd>health care</kwd>
        <kwd>health outcomes</kwd>
        <kwd>precision medicine</kwd>
        <kwd>decision support</kwd>
        <kwd>health industry</kwd>
        <kwd>clinical implications</kwd>
        <kwd>machine learning methods</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>Social determinants of health (SDoH), such as financial resources [<xref ref-type="bibr" rid="ref1">1</xref>] and housing stability [<xref ref-type="bibr" rid="ref2">2</xref>], account for between 30% and 55% of people’s health outcomes [<xref ref-type="bibr" rid="ref3">3</xref>]. While many studies have identified strong associations between specific SDoH and health outcomes, most people experience multiple SDoH concurrently in their daily lives [<xref ref-type="bibr" rid="ref4">4</xref>-<xref ref-type="bibr" rid="ref8">8</xref>]. For example, limited access to education, unstable employment, and lack of access to health care tend to frequently co-occur across individuals, leading to long-term stress and depression [<xref ref-type="bibr" rid="ref8">8</xref>]. Such complex interactions among multiple SDoH make it critical to analyze combinations of SDoH versus single factors. However, analysis of such co-occurrences and their risks of adverse health outcomes requires the integration of personal, clinical, social, and environmental information, critical for designing cost-effective and targeted interventions. Unfortunately, the lack of databases containing such multiple datatypes from the same individuals has resulted in a fragmented understanding of how SDoH co-occur and impact health, which is critical for designing targeted interventions.</p>
        <p>The <italic>All of Us</italic> program [<xref ref-type="bibr" rid="ref9">9</xref>-<xref ref-type="bibr" rid="ref11">11</xref>] provides an unprecedented opportunity to address this fragmented view of SDoH. This program aims to collect data from multiple sources related to 1 million or more individuals, with a focus on populations that have been traditionally underrepresented in biomedical research. These data sources include electronic health records (EHRs), health surveys, whole-sequence genome data, physical measurements, and personal digital information. Critically, <italic>All of Us</italic> provides several survey modules containing a wide range of SDoH-related questions, which, in combination with other data sources, could transform our understanding of high-risk combinations of SDoH [<xref ref-type="bibr" rid="ref9">9</xref>].</p>
        <p>However, little is known about the range of and responses to SDoH questions in <italic>All of Us</italic> and how they co-occur to form subtypes, which are critical for designing targeted interventions. To address these gaps, we characterized 110 SDoH in <italic>All of Us</italic>, which guided the methods we used to analyze how they co-occur to form subtypes and their risk of adverse health outcomes. The results helped highlight the opportunities and challenges for conducting subtype analysis in <italic>All of Us</italic>, which integrates multiple datatypes through the use of scalable and generalizable machine learning methods aimed at designing targeted interventions.</p>
      </sec>
      <sec>
        <title>Models and Research Related to SDoH</title>
        <p>The World Health Organization defines SDoH as the “non-medical factors that influence health outcomes” [<xref ref-type="bibr" rid="ref3">3</xref>]. Specifically, these include the conditions in which people are born, grow, work, live, and age. Furthermore, such conditions are shaped by a wider set of forces, such as economic and social policies, and systems, such as discriminatory laws and structural racism.</p>
        <p>Several models have proposed the factors and mechanisms involved in SDoH [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref12">12</xref>]. These models were motivated by the concept of <italic>social gradient</italic> [<xref ref-type="bibr" rid="ref13">13</xref>], an empirical phenomenon observed within and across nations [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref15">15</xref>] consistently showing that the lower an individual’s socioeconomic position, the worse their health. To help explain the factors underlying the social gradient, the model by Dahlgren and Whitehead [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref16">16</xref>] proposed several interconnected layers of social determinants that influence health. As shown in <xref rid="figure1" ref-type="fig">Figure 1</xref> [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref16">16</xref>], the innermost layer comprises demographic and genetic factors, which are largely unmodifiable. In contrast, the outer layers are modifiable to different degrees, such as lifestyle (eg, exercise and smoking); social and community networks (eg, contact with supportive friends and family); living and working conditions (eg, access to health care and employment); and broader socioeconomic, cultural, and environmental conditions (eg, crime in the neighborhood). While this model was not intended to provide explicit testable hypotheses [<xref ref-type="bibr" rid="ref4">4</xref>], the factors within each layer are expected to co-occur and impact each other in addition to responding to external forces such as systemic racism and capitalism when it is focused on financial profits at the expense of societal benefits.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>The Dahlgren-Whitehead conceptual model aimed at visually showing the interrelated layers of social determinant of health domains that influence health (reproduced from Dahlgren and Whitehead, 2021).</p>
          </caption>
          <graphic xlink:href="jmir_v27i1e48775_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>These early SDoH models motivated numerous studies [<xref ref-type="bibr" rid="ref17">17</xref>] that analyzed associations among specific SDoH (eg, immigration status and home density [<xref ref-type="bibr" rid="ref7">7</xref>]), their association with health outcomes (eg, education and mortality [<xref ref-type="bibr" rid="ref18">18</xref>]), and how they manifest within subpopulations (eg, patients with diabetes [<xref ref-type="bibr" rid="ref19">19</xref>]). More recently, organizations such as the Centers for Disease Control and Prevention and <italic>Healthy People 2030</italic> (HP-30) have classified these empirical results into SDoH domains that roughly map to the Dahlgren-Whitehead model. For example, HP-30 organized SDoH empirical studies into five SDoH domains: (1) economic stability, (2) education access and quality, (3) health care access and quality, (4) neighborhood and built environment, and (5) social and community context. Furthermore, the PhenX program (which provides well-established measurement protocols for use in biomedical and translational research) has identified SDoH data collection protocols to enable more systematic data collection and analysis [<xref ref-type="bibr" rid="ref20">20</xref>-<xref ref-type="bibr" rid="ref22">22</xref>].</p>
        <p>While the aforementioned findings and categorizations have greatly improved our understanding of SDoH and their impact on health, they have been mostly analyzed based on snapshots of associations between a few factors and health outcomes. In contrast, SDoH models and recent empirical studies suggest that multiple SDoH tend to co-occur and impact each other. For example, during the pandemic, Hispanic and Black or African American individuals not only had a higher exposure to COVID-19 due to their frontline jobs and overcrowded living conditions but also had a higher risk of serious infections due to previous health conditions not addressed due to lack of health care access [<xref ref-type="bibr" rid="ref4">4</xref>]. Similarly, undocumented immigrants with lower incomes living in neighborhoods with high pollution, combined with the stress of deportation, have an increased risk of multiple chronic conditions such as depression and lung cancer [<xref ref-type="bibr" rid="ref7">7</xref>]. Such studies have resulted in the Centers for Medicare and Medicaid Services emphasizing that SDoH are a multilevel construct that includes both individual and contextual factors that have complex interactions [<xref ref-type="bibr" rid="ref23">23</xref>]. Furthermore, a distinction has been made between the aforementioned SDoH at the community level and social needs at the individual level [<xref ref-type="bibr" rid="ref24">24</xref>]. However, while this distinction is critical when designing care pathways, there is growing consensus [<xref ref-type="bibr" rid="ref25">25</xref>] that SDoH is an umbrella term that covers both levels, and it is an approach that has been adopted by both the PhenX Toolkit [<xref ref-type="bibr" rid="ref21">21</xref>] and the <italic>All of Us</italic> surveys on SDoH widely used for analysis [<xref ref-type="bibr" rid="ref9">9</xref>-<xref ref-type="bibr" rid="ref11">11</xref>]. Therefore, we use <italic>SDoH</italic> to include all levels of nonmedical factors that impact health and well-being.</p>
        <p>The aforementioned co-occurrences of multiple SDoH and their impact on health directly reflect the interconnected layers of the Dahlgren-Whitehead model shown in <xref rid="figure1" ref-type="fig">Figure 1</xref>. However, analysis of such co-occurrences and their health outcomes requires large datasets with multiple datatypes that have only recently been made available through the <italic>All of Us</italic> program.</p>
      </sec>
      <sec>
        <title>All of Us: Multiple Datatypes Across a Large Cohort of Underrepresented Americans</title>
        <p>The <italic>All of Us</italic> research program [<xref ref-type="bibr" rid="ref9">9</xref>-<xref ref-type="bibr" rid="ref11">11</xref>] (<italic>All of Us</italic>), funded by the National Institutes of Health since 2015, aims to accelerate biomedical research to enable discoveries leading to individualized and equitable prevention and treatment. Such research is currently hampered due to the <italic>limited range</italic> of personal, clinical, social, and environmental variables available for the same individuals; <italic>limited representation</italic> in research datasets of socially marginalized populations; and <italic>limited access</italic> to individual-level data due to privacy laws.</p>
        <p>To overcome these hurdles, <italic>All of Us</italic> provides three critical features: (1) a data repository that is projected to contain 1 million or more participants with data from multiple sources, including EHRs, health surveys, whole-sequence genomic data, physical measurements, and personal digital information such as from Fitbit trackers; (2) a cohort targeted to include 75% of participants from populations underrepresented in research (race, ethnicity, gender, sex, sexual orientation, and disability) oversampled from the US population; and (3) strictly enforced rules to prevent reidentification of participants by disallowing the download of any participant data or reporting of research results for subgroups of &lt;20. These rules allow for analysis of the <italic>All of Us</italic> data to be categorized as non–human subjects research, which, combined with training and personal authentication by researchers, has resulted in a substantial reduction in administrative hurdles.</p>
        <p>As of December 30, 2022 (Controlled Tier; version 6), <italic>All of Us</italic> contained 372,397 total participants, with 8.6% who had attempted all 9 health surveys (7 related to demographics and general health and 2 related to COVID-19) and 26.5% who had genomic data. Critical to this study is the recent addition of a survey specifically targeted to SDoH questions, which has been attempted by 15.5% in the <italic>All of Us</italic> cohort. A preliminary analysis revealed that SDoH appear to be distributed across multiple health surveys and EHR codes, with participants providing those data at different times on a rolling basis. However, little is known about the range of and responses to SDoH questions in <italic>All of Us</italic> and how SDoH co-occur to form subtypes, a critical step for selecting the methods to identify and interpret SDoH subtypes.</p>
      </sec>
      <sec>
        <title>Computational Methods to Identify and Interpret Subtypes</title>
        <p>A wide range of studies [<xref ref-type="bibr" rid="ref26">26</xref>-<xref ref-type="bibr" rid="ref34">34</xref>] on topics ranging from molecular to environmental determinants of health have shown that most humans tend to share a subset of characteristics (eg, comorbidities, symptoms, and genetic variants), forming distinct subtypes (also referred to as <italic>subgroups</italic> or <italic>subphenotypes</italic> depending on the condition and variables analyzed). A primary goal of precision medicine is to identify such subtypes and infer their underlying disease processes to design interventions targeted to those processes [<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref35">35</xref>]. Methods to identify subtypes include (1) investigator-selected variables such as race for developing hierarchical regression models [<xref ref-type="bibr" rid="ref36">36</xref>] or assigning patients to different arms of a clinical trial, (2) existing classification systems such as the Medicare Severity Diagnosis Related Group [<xref ref-type="bibr" rid="ref37">37</xref>] to assign patients to a disease category for purposes of billing, and (3) computational methods such as classification [<xref ref-type="bibr" rid="ref38">38</xref>-<xref ref-type="bibr" rid="ref40">40</xref>] and clustering [<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref41">41</xref>] to discover subtypes.</p>
        <p>Several studies have used computational methods to identify subtypes, each with critical trade-offs. Some studies have used <italic>combinatorial</italic> approaches [<xref ref-type="bibr" rid="ref42">42</xref>] (eg, identify all pairs, all triples, and so on), which are intuitive but which can lead to a combinatorial explosion (eg, enumerating combinations of the 31 Elixhauser comorbidities would lead to 2<sup>31</sup> or 2,147,483,648 combinations), with most combinations not incorporating the full range of symptoms (eg, the most frequent pair of symptoms ignores what other symptoms exist in the profile of patients with that pair). Other studies have used <italic>unipartite</italic> clustering methods [<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref41">41</xref>] (clustering patients or comorbidities but not both together), such as k-means and hierarchical clustering, and dimensionality reduction methods, such as principal component analysis, to help identify clusters of frequently co-occurring comorbidities [<xref ref-type="bibr" rid="ref42">42</xref>-<xref ref-type="bibr" rid="ref48">48</xref>]. However, such methods have well-known limitations, including the requirement of inputting user-selected parameters (eg, similarity measures and the number of expected clusters) in addition to the lack of a quantitative measure to describe the quality of the clustering (critical for measuring the statistical significance of the clustering). Furthermore, because these methods are unipartite, there is no agreed-upon method to identify the patient subgroup defined by a cluster of variables, and vice versa.</p>
        <p>More recently, bipartite network analysis [<xref ref-type="bibr" rid="ref49">49</xref>] (see <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> [<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref50">50</xref>-<xref ref-type="bibr" rid="ref55">55</xref>] for additional details) has been used to address the aforementioned limitations by automatically identifying <italic>biclusters</italic> consisting of patients and characteristics simultaneously. This method takes as input any dataset, such as <italic>All of Us</italic> participants and their SDoH, and outputs a quantitative and visual description of biclusters (containing both participant subgroups and their frequently co-occurring SDoH). The quantitative output generates the number and members of the biclusters, in addition to the statistical significance of the biclusteredness [<xref ref-type="bibr" rid="ref50">50</xref>-<xref ref-type="bibr" rid="ref52">52</xref>], and the visual output displays the quantitative information of the biclusters through a network visualization [<xref ref-type="bibr" rid="ref53">53</xref>-<xref ref-type="bibr" rid="ref55">55</xref>]. Therefore, bipartite network analysis enables (1) the automatic identification of biclusters and the significance of their biclusteredness and (2) the visualization of the biclusters critical for their clinical interpretability. Furthermore, the attributes of participants in a subgroup can be used to measure the subgroup risk of an adverse health outcome, develop classifiers for categorizing a new participant into one or more of the subgroups, and develop a predictive model that uses that subgroup membership for measuring the risk of an adverse health outcome for the classified participant.</p>
        <p>However, while several studies [<xref ref-type="bibr" rid="ref52">52</xref>,<xref ref-type="bibr" rid="ref56">56</xref>-<xref ref-type="bibr" rid="ref63">63</xref>] have demonstrated the usefulness of bipartite networks for the identification and clinical interpretation of subgroups, there has been no systematic attempt to identify SDoH subtypes, mainly because of the lack of large cohorts containing a wide coverage of SDoH. The <italic>All of Us</italic> program provides an opportunity to use bipartite networks for the identification and interpretation of SDoH subtypes using a wide range of variables in a large cohort and for analyzing their risk of adverse health outcomes, a critical step in advancing precision medicine.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Research Questions</title>
        <p>Our analysis was guided by two research questions targeting the <italic>All of Us</italic> dataset:</p>
        <list list-type="order">
          <list-item>
            <p>What are the range of and responses to survey questions related to SDoH?</p>
          </list-item>
          <list-item>
            <p>How do SDoH co-occur to form subtypes, and what are their risks for adverse health outcomes?</p>
          </list-item>
        </list>
      </sec>
      <sec>
        <title>Expert Panel</title>
        <p>The selection of the research questions, variables, cohort, methods, and results and their interpretation were guided by an expert panel consisting of SDoH researchers with a professional background in applied demography, gerontology, and rehabilitation who worked closely with the machine learning and biostatistics researchers. The overall project and manuscript were examined by an ethicist for bias, stigma, and perpetuation of stereotypes. Therefore, the examination of each step in the project was aligned with the human-centered artificial intelligence approach [<xref ref-type="bibr" rid="ref64">64</xref>-<xref ref-type="bibr" rid="ref66">66</xref>].</p>
      </sec>
      <sec>
        <title>Data Description</title>
        <sec>
          <title>Study Population</title>
          <p>For question 1, we analyzed the full <italic>All of Us</italic> cohort (N=372,397) and characterized their responses to all the SDoH questions identified by the expert panel (described in the <italic>Variables</italic> section). For question 2, we analyzed all participants (n=12,913) who had valid responses to the SDoH questions identified in question 1 and used them to identify subtypes and their risks of specific outcomes.</p>
        </sec>
        <sec>
          <title>Variables</title>
          <p>For question 1, the expert panel was asked to review all 1113 questions across 6 <italic>All of Us</italic> non–COVID-19 health surveys, each of which was attempted once per participant (<italic>The Basics</italic>, <italic>Lifestyle</italic>, <italic>Overall Health</italic>, <italic>Personal/Family Health History</italic>, <italic>Health Care Access and Utilization</italic>, and <italic>SDoH</italic>), and the 2843 Systematized Medical Nomenclature of Medicine (SNOMED) codes related to SDoH [<xref ref-type="bibr" rid="ref67">67</xref>]. The expert panel arrived at a consensus for the SDoH across the surveys and the SNOMED codes. As the SDoH-related SNOMED codes in the EHRs had very low use (see <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref> for a characterization), they were not further analyzed.</p>
          <p>For question 2, to identify and analyze the SDoH subtypes, we used the following variables:</p>
          <list list-type="order">
            <list-item>
              <p>Independent variables included the SDoH factors identified from question 1.</p>
            </list-item>
            <list-item>
              <p>Covariates included 3-digit zip code (to determine whether participants in each subtype came from a state that accepted Medicaid expansion, providing greater access to health insurance) and demographics (eg, age, sex, and race).</p>
            </list-item>
            <list-item>
              <p>A total of 3 outcomes were included: <italic>depression</italic>, <italic>delayed medical care</italic>, and <italic>emergency room (ER) visits in the last year</italic>. <italic>Depression</italic> was selected as it is a common health outcome when individuals encounter SDoH in their daily lives, such as long-term stress resulting from racism [<xref ref-type="bibr" rid="ref68">68</xref>], and the dysregulation of the hypothalamic-pituitary-adrenal axis [<xref ref-type="bibr" rid="ref69">69</xref>]. Depression was defined as having a positive response to both of the following questions in <italic>The Basics</italic> survey—“Are you still seeing a doctor or health care provider for depression?” and “Has a doctor or health care provider ever told you that you have Depression?”—or having SNOMED codes related to depression in their EHRs (35489007, 36923009, 370143000, 191616006, or 66344007). <italic>Delayed medical care</italic> was selected as it often results from the lack of medical insurance, which can impact the use of medical care when needed, leading to poorer health outcomes [<xref ref-type="bibr" rid="ref70">70</xref>]. Delayed medical care was defined as having one or more positive responses to 9 survey questions (delayed care due to transportation, rurality, nervousness, work, childcare, copay, older adult care, out-of-pocket costs, and deductible costs) in the <italic>Health Care Access</italic> and <italic>Utilization</italic> survey. <italic>Emergency room (ER) visits in the last year</italic> was selected because lack of medical insurance often results in individuals not seeking early medical care when needed, leading to an exacerbation of conditions precipitating one or more ER visits [<xref ref-type="bibr" rid="ref71">71</xref>]. As the survey questions that we used for SDoH subtyping were based on outcomes in the previous year, we defined ER visits for a participant as having one or more ER visits (current procedural terminology 99281-99285) 1 year preceding the date when the SDoH survey was completed.</p>
            </list-item>
          </list>
        </sec>
      </sec>
      <sec>
        <title>Analytical Approach</title>
        <sec>
          <title>Question 1: What Are the Range of and Responses to Survey Questions Related to SDoH?</title>
        </sec>
        <sec>
          <title>Identification and Coding of SDoH</title>
          <p>To analyze the range and responses to the survey questions, we first characterized all SDoH in <italic>All of Us</italic> at two levels of granularity—(1) SDoH questions based on the surveys used to collect the data and (2) SDoH factors, which were categories of the SDoH questions to form a coarser-grained classification (see <xref rid="figure2" ref-type="fig">Figure 2</xref>, which explains SDoH questions, factors, and subtypes).</p>
          <fig id="figure2" position="float">
            <label>Figure 2</label>
            <caption>
              <p>Examples showing how the social determinants of health (SDoH) questions from the <italic>All of Us</italic> surveys that differed in their levels of granularity were transformed by the expert panel into SDoH factors with uniform granularity to ensure consistency for analysis and interpretation and clustered into SDoH subtypes through machine learning. The SDoH questions and factors were subsequently analyzed for coverage across the 5 Healthy People 2030 domains.</p>
            </caption>
            <graphic xlink:href="jmir_v27i1e48775_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
          <p>To identify the SDoH questions, members of the expert panel independently used their domain knowledge about SDoH to identify and code the SDoH questions and examine their range with respect to the 5 HP-30 domains using the following steps: (1) reviewed all 1113 questions across 6 health surveys (excluding 2 related to COVID-19) and extracting all SDoH questions that were relevant, (2) transformed all positive or value-free questions into negative phrases and abbreviating them for interpretability in the graphs (eg, <italic>How often do you have someone help you read health-related materials?</italic> was changed to <italic>No one to help read health materials</italic>), (3) reverse coded and dichotomized the abbreviated SDoH questions (eg, always or often=1 and never, occasionally, or sometimes=0), and (4) categorized the SDoH questions into 1 of the 5 HP-30 SDoH domains (economic stability, education access and quality, health care access and quality, neighborhood and built environment, and social and community context). The expert panel subsequently met and collaboratively resolved any differences among their coding schemes to arrive at a consensus (see <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref> for the 110 SDoH questions and their consensus coding by the expert panel).</p>
          <p>To characterize the SDoH factors, the expert panel arrived at a consensus to categorize one or more of the aforementioned SDoH questions in <italic>All of Us</italic> into SDoH factors and examined their range with respect to HP-30 using the following steps: (1) reviewed the subgrouping labels of questions in the <italic>All of Us</italic> surveys and integrating them to categorize the SDoH into factors, (2) coded a participant as having a “1” for an SDoH factor if they answered one or more of the questions within that factor with a “1,” and (3) categorized the SDoH factors into 1 of the 5 HP-30 SDoH domains (economic stability, education access and quality, health care access and quality, neighborhood and built environment, and social and community context; see <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref> for the 110 SDoH questions, their consensus coding into 19 SDoH factors, and mapping to the 5 SDoH domains from HP-30).</p>
        </sec>
        <sec>
          <title>Analysis of the Range and Responses to SDoH Questions and Factors</title>
          <p>The aforementioned knowledge-based classification of SDoH questions and SDoH factors was analyzed to examine their range (with respect to the 5 HP-30 domains) and their responses (across all participants in <italic>All of Us</italic>) using the following four methods: (1) bar graph displaying the number of participants who had valid answers (all responses other than “skip” or “choose not to answer”) to each of the SDoH questions, sorted by survey based on mean response, and then sorted by raw response within each survey. Finally, to analyze their range, each bar was colored to denote one of the 5 SDoH domains defined by HP-30; (2) Venn diagram showing how many participants had cross-sectionally valid responses to all identified SDoH questions or factors; (3) table describing the number and proportion of race, ethnicity, sex, gender, and age between those who answered the SDoH questions or factors and those who did not have valid responses; and (4) frequency distribution of the number of SDoH questions or factors across participants who had valid responses for all the SDoH questions. The aforementioned plots are shown in the <italic>Results</italic> section.</p>
        </sec>
        <sec>
          <title>Question 2: How Do SDoH Co-Occur to Form Subtypes, and What Are their Risks for Adverse Health Outcomes?</title>
          <sec>
            <title>Data</title>
            <p>We used the cohort identified in question 1 (participants who had valid answers to all the SDoH questions). However, examination of the SDoH questions revealed that some of them (eg, <italic>cannot afford dental care</italic> and <italic>cannot afford prescriptions</italic>) had a finer level of granularity compared to others (eg, single household). As the questions with a finer level of granularity tend to be more strongly corelated to each other in comparison to other coarser-grained questions, they also tend to cluster together more strongly, confounding the interpretation of the subtypes. In contrast, as the SDoH factors had a more uniform granularity and were at a level of abstraction that was appropriate to guide referral to the proper social services, we used them to identify the SDoH subtypes.</p>
          </sec>
          <sec>
            <title>Analytical Model</title>
            <sec>
              <title>Overview</title>
              <p>To identify SDoH subtypes, their associations with outcomes and covariates, and their future translation into precision medicine and public policies, we used a 3-part analytical framework called heterogenization, integration, and translation (HIT). As shown in <xref rid="figure3" ref-type="fig">Figure 3</xref>, the <italic>heterogenization</italic> step was used to identify the subtypes through the use of bipartite modularity maximization [<xref ref-type="bibr" rid="ref50">50</xref>-<xref ref-type="bibr" rid="ref52">52</xref>] (see <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> for more details), the <italic>integration</italic> step was used to measure the association of each subtype with multiple datatypes [<xref ref-type="bibr" rid="ref72">72</xref>], and the <italic>translation</italic> step was used to qualitatively interpret the subtypes [<xref ref-type="bibr" rid="ref72">72</xref>] with the goal of developing in the future a decision support system to translate the subtypes into clinical practice and the design of public policies. The following sections describe the specific methods used in each of the HIT steps.</p>
              <fig id="figure3" position="float">
                <label>Figure 3</label>
                <caption>
                  <p>The three steps of the heterogenization, integration, and translation framework to analyze social determinants of health (SDoH): (1) heterogenization of the data to identify subtypes, (2) integration of multiple datatypes such as from electronic health records (eg, depression) and information on state of residency (eg, to determine Medicaid expansion) to determine the risk and enrichment of each subtype, and (3) translation of subtypes through interpretation and predictive modeling with the goal of designing clinical decision support systems and public policy. SLC6A4: Serotonin Transporter Gene Polymorphism.</p>
                </caption>
                <graphic xlink:href="jmir_v27i1e48775_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
              </fig>
            </sec>
            <sec>
              <title>Heterogenization: Identification of Subtypes</title>
              <p>As there were many participants who did not have valid answers to the SDoH questions, dropping them resulted in differences in the proportion of demographic variables compared with the full <italic>All of Us</italic> cohort. Therefore, the data needed to be adjusted to better reflect the overall <italic>All of Us</italic> participants. To adjust the demographic distribution of the cohort to match the full <italic>All of Us</italic> cohort, we used inverse probability weighting (IPW) [<xref ref-type="bibr" rid="ref73">73</xref>,<xref ref-type="bibr" rid="ref74">74</xref>]. IPW calculates weights to proportionally boost the values of participants who are underrepresented in a cohort with respect to a comparison, such as the full <italic>All of Us</italic> dataset, using a method similar to that of an earlier study on <italic>All of Us</italic> [<xref ref-type="bibr" rid="ref75">75</xref>] (<xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>). Next, we multiplied the IPW-generated weights with the original binary values for each participant in our cohort and used the min-max method to range-normalize those weights within each SDoH factor. Finally, to test the replicability of the SDoH factor biclustering, we randomly divided the dataset into a training and a replication dataset.</p>
              <p>We identified subtypes in the training dataset and tested the degree to which the SDoH factor co-occurrences were replicated in the replication dataset using the following steps: (1) modeled participants and SDoH factors as a weighted bipartite network (step 1 in <xref rid="figure3" ref-type="fig">Figure 3</xref>) where nodes were either participants (circles) or SDoH factors (triangles) and the associations between participant–SDoH factor pairs were weighted edges (lines) generated from IPW (the inclusion of IPW-generated weights enabled the network to represent the demographic distribution of the full <italic>All of Us</italic> dataset), (2) used a bipartite modularity maximization algorithm [<xref ref-type="bibr" rid="ref50">50</xref>-<xref ref-type="bibr" rid="ref52">52</xref>] (which takes edge weights into consideration) to identify the number of biclusters and their members and measure the degree of biclusteredness through bicluster modularity (<italic>Q</italic>, defined as the fraction of edges falling within a cluster minus the expected fraction of such edges in a network of the same size with randomly assigned edges), (3) measured the significance of <italic>Q</italic> by comparing it to a distribution of the same quantity generated from 1000 random permutations of the network while preserving the network size (number of nodes) and the distribution of weighted edges for each participant, (4) used the Rand index (RI) to measure the degree to which SDoH occurred and did not co-occur in the same cluster in the training and replication datasets, and (5) measured the significance of the RI by comparing it to the mean of a distribution of the same quantity generated by randomly permuting the training and replication datasets 1000 times while preserving the size of the networks and the distribution of weighted edges for each participant.</p>
            </sec>
            <sec>
              <title>Integration: Risk and Enrichment of Subtypes</title>
              <p>We used logistic regression to measure the odds ratio (OR) for each subtype compared pairwise to each of the other subtypes for the 3 outcomes (depression, delayed medical care, and ER visits in the last year) and for living in a state with no Medicaid expansion. To adjust for the difference in demographics due to the missingness, we used weights generated from IPW for each participant, and the comparisons were adjusted for demographics (eg, age, sex, and race) and corrected for multiple testing within each outcome using false discovery rate. As 13.07% (1688/12,913) of the participants did not have 3-digit zip code information, we used IPW to measure the weights of the cohort and used them to account for potential sample selection bias.</p>
            </sec>
            <sec>
              <title>Translation: Interpretation of Subtypes</title>
              <p>The subtype interpretation was done using the following steps: (1) used the <italic>Fruchterman-Reingold</italic> [<xref ref-type="bibr" rid="ref53">53</xref>] and <italic>ExplodeLayout</italic> [<xref ref-type="bibr" rid="ref54">54</xref>,<xref ref-type="bibr" rid="ref55">55</xref>] algorithms to visualize the bipartite network along with the risk of each of the outcomes; (2) asked the expert panel to independently label the subtypes, infer the mechanisms that increase the risks in each subtype for the 3 outcomes (depression, delayed medical care, and ER visits in the last year) with potential strategies to reduce those risks, and then collaboratively come to a consensus; and (3) asked an ethicist to examine the results and their interpretations for bias, stigma, and perpetuation of stereotypes.</p>
            </sec>
          </sec>
        </sec>
        <sec>
          <title>Ethical Considerations</title>
          <p>The original data collection by the <italic>All of Us</italic> program was approved by an institutional review board as described on the web [<xref ref-type="bibr" rid="ref76">76</xref>].</p>
          <p>The secondary analysis of the <italic>All of Us</italic> data conducted in this work did not receive approval or exemption from an institutional review board. Such an approval or exemption is not required as described on the web [<xref ref-type="bibr" rid="ref77">77</xref>].</p>
          <p>Therefore, the authors had permission to conduct a secondary analysis of the data.</p>
        </sec>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Question 1: What Are the Range of and Responses to Survey Questions Related to SDoH?</title>
        <sec>
          <title>Identification and Coding of SDoH Questions and Factors</title>
          <p>The expert panel identified 110 questions from 4 surveys (<italic>The Basics</italic>, <italic>Overall Health</italic>, <italic>Healthcare Access and Utilization</italic>, and <italic>SDoH</italic>). Of these 110 questions, 110 (100%) were abbreviated, and 48 (43.6%) were negatively worded and coded (<xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>). The 110 SDoH questions were further categorized into 19 SDoH factors (one of these was <italic>Delayed medical care</italic>, which was used as an outcome).</p>
        </sec>
        <sec>
          <title>Responses to SDoH Questions and Factors</title>
          <p>As shown in <xref rid="figure4" ref-type="fig">Figure 4</xref>A, the number of valid responses to each of the 110 SDoH questions was largely dictated by the surveys in which the responses were solicited. SDoH from 2 surveys (<italic>The Basics</italic> and <italic>Overall Health</italic>) had the most valid responses (mean 349,434, SD 23,556), followed by <italic>Healthcare Access and Utilization</italic> (mean 149,898, SD 6146) and, finally, the <italic>SDoH</italic> survey (mean 55,960, SD 1083). This pattern of responses matched how answers to each of the surveys were solicited—at enrollment, all participants are required to do <italic>The Basics</italic> and <italic>Overall Health</italic> surveys, and then, on a rolling basis, responses to the other surveys are solicited. The <italic>SDoH</italic> survey was the last survey that was solicited, which explained it having the lowest number of responses. As shown in <xref rid="figure4" ref-type="fig">Figure 4</xref>B, this pattern of missingness held for the responses at the SDoH factor level, which was not unexpected as the SDoH factors were aggregations of the SDoH questions. However, as shown in <xref rid="figure4" ref-type="fig">Figures 4</xref>A and 4B by the uneven number of valid responses within each survey block, there were several SDoH questions that had invalid responses (“skip” or “choose not to answer”) at both levels of granularity: <italic>The Basics</italic> (339,254/5,655,412, 5.99%), <italic>Healthcare Access and Utilization</italic> (341,516/5,587,957, 6.11%), <italic>Overall Health</italic> (32,669/744,126, 4.39%), and <italic>SDoH</italic> (83,699/3,206,035, 2.61%). Furthermore, the proportion of valid to invalid responses among them was significantly different for the SDoH questions (N=365,237, χ<sup>2</sup><sub>2</sub>=57.5; <italic>P</italic>&lt;.001) and for the SDoH factors (N=372,063, χ<sup>2</sup><sub>2</sub>=75.6; <italic>P</italic>&lt;.001).</p>
          <fig id="figure4" position="float">
            <label>Figure 4</label>
            <caption>
              <p>The number of valid responses for (A) 110 social determinants of health (SDoH) questions and (B) 18 SDoH factors. The colors denote how the SDoH in each were categorized based on the 5 Healthy People 2030 (HP-30) domains. Rx: prescription medication.</p>
            </caption>
            <graphic xlink:href="jmir_v27i1e48775_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Range of SDoH Questions and Factors</title>
          <p>As shown by the colored bars in <xref rid="figure4" ref-type="fig">Figure 4</xref>, the surveys spanned the full range of the 5 SDoH HP-30 domains. The SDoH questions in <italic>The Basics</italic> and <italic>Overall Health</italic> surveys were predominantly related to economic stability (blue) and social and community context (purple), those in the <italic>Healthcare Access and Utilization</italic> survey were all related to that topic (green), whereas those from the <italic>SDoH</italic> survey were a mix of all 4 domains. Overall, the 4 surveys contained 110 SDoH questions that together had 100% coverage of the 5 HP-30 domains (social and community context: n=38, 34.5%; neighborhood and built environment: n=19, 17.3%; economic stability: n=10, 9.1%; education access and quality: n=2, 1.8%; health care access and quality: n=42, 38.2%). This characterization suggests that, while the SDoH in <italic>All of Us</italic> have broad domain coverage across the surveys, analysis of them requires access to all 4 surveys, each of which has different levels of completion and valid responses.</p>
        </sec>
        <sec>
          <title>Cohort With Maximized Valid Responses</title>
          <p>Given the large degree and systematic nature of missingness in 2 of the 4 surveys, we could not use multiple imputation to estimate the values. Therefore, we had to find a subset of participants who had valid responses to all the SDoH questions. An examination revealed that 2 SDoH questions had &lt;10% of responses (<italic>English verbal frequency</italic>: 6193/371,942, 1.67%; <italic>Neighborhood has no recreation spaces</italic>: 31,152/371,942, 8.38%), accounting for the largest loss in cohort size with valid responses. Therefore, these questions were dropped from further analysis. Furthermore, one question required a branched response (<italic>Living situation</italic> branching to <italic>Did not live in a house</italic>), and these responses were merged. Finally, as we used <italic>Delayed medical care</italic> as an outcome, 8.2% (9/110) of the questions related to that topic were removed, resulting in a total of 98 SDoH questions. As shown in <xref rid="figure5" ref-type="fig">Figure 5</xref>, a Venn diagram of the overlap among the valid responses across the surveys revealed that 3.47% (12,913/372,397) of the participants had valid responses to all 98 SDoH questions.</p>
          <fig id="figure5" position="float">
            <label>Figure 5</label>
            <caption>
              <p>Venn diagram showing 3.47% (12,913/372,397) of participants of the full cohort who had valid responses to all 98 social determinants of health (SDoH) questions.</p>
            </caption>
            <graphic xlink:href="jmir_v27i1e48775_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Co-Occurrence of the Number of SDoH Across Responders</title>
          <p>As shown in <xref rid="figure6" ref-type="fig">Figure 6</xref>, participants had a median of 15 SDoH question co-occurrences and a median of 9 SDoH factor co-occurrences. Furthermore, participants of racial and ethnic minority groups who had valid responses to the 110 SDoH questions had a significantly higher median number of co-occurring SDoH compared to the equivalent White population (median 20 for participants of racial and ethnic minority groups; median 14 for White participants; <italic>P</italic>&lt;.001). These results show the high co-occurrences of SDoH at both levels of granularity, with a significant difference in median co-occurrences between the White participants and the participants of racial and ethnic minority populations with valid responses.</p>
          <fig id="figure6" position="float">
            <label>Figure 6</label>
            <caption>
              <p>Frequency distribution of (A) number of co-occurring responses to social determinant of health (SDoH) questions across the 12,913 participants with valid answers to the 98 SDoH questions and (B) number of co-occurring SDoH factors across 19 SDoH factors.</p>
            </caption>
            <graphic xlink:href="jmir_v27i1e48775_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Participant Demographics With Valid Responses to SDoH Questions</title>
          <p>As the cohort size dropped to 3.47% (12,913/372,397), we analyzed how that impacted the demographic distribution compared with the overall <italic>All of Us</italic> dataset. As shown in <xref ref-type="table" rid="table1">Table 1</xref>, there were statistically significant differences in race (N=372,397, χ<sup>2</sup><sub>5</sub>=2073.1; <italic>P</italic>&lt;.001) and ethnicity (N=372,397, χ<sup>2</sup><sub>9</sub>=6292.2; <italic>P</italic>&lt;.001) between the 2 cohorts after multiple testing correction, with a higher proportion of White participants having valid answers than participants of racial or ethnic minority groups. Furthermore, there was a statistically significant difference in age between the participants who had valid answers and those who did not (<italic>H</italic>1=148.08; <italic>P</italic>&lt;.001). These results show the demographic differences between the cohort with complete and valid answers to the SDoH questions and the full <italic>All of Us</italic> dataset, necessitating the use of IPW–generated weights to address those imbalances, as discussed in question 2.</p>
          <table-wrap position="float" id="table1">
            <label>Table 1</label>
            <caption>
              <p>The demographic differences between the total <italic>All of Us</italic> (AoU) participants and those who had valid answers to all 110 social determinant of health (SDoH) questions (N=372,397). Participant counts of &lt;20 are shown as a count of 20 based on the AoU reporting rules.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="30"/>
              <col width="350"/>
              <col width="250"/>
              <col width="370"/>
              <thead>
                <tr valign="top">
                  <td colspan="2">Demographics</td>
                  <td>Total AoU participants</td>
                  <td>Total AoU participants with valid<sup>a</sup> SDoH answers (n=12,913)</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td colspan="4">
                    <bold>Race, n (%)</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Asian</td>
                  <td>12,459 (3.35)</td>
                  <td>324 (2.51)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Black or African American</td>
                  <td>73,383 (19.71)</td>
                  <td>482 (3.73)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>White</td>
                  <td>201,149 (54.01)</td>
                  <td>11,279 (87.35)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Other or &gt;1 population</td>
                  <td>26,890 (7.22)</td>
                  <td>343 (2.66)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>None indicated</td>
                  <td>58,516 (15.71)</td>
                  <td>485 (3.76)</td>
                </tr>
                <tr valign="top">
                  <td colspan="4">
                    <bold>Ethnicity, n (%)</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Not Hispanic or Latino</td>
                  <td>288,227 (77.4)</td>
                  <td>12,095 (93.67)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Hispanic or Latino</td>
                  <td>66,704 (17.91)</td>
                  <td>751 (5.82)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Additional options</td>
                  <td>17,466 (4.69)</td>
                  <td>67 (0.52)</td>
                </tr>
                <tr valign="top">
                  <td colspan="4">
                    <bold>Sex at birth, n (%)</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Female</td>
                  <td>222,495 (59.75)</td>
                  <td>8236 (63.78)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Male</td>
                  <td>138,831 (37.28)</td>
                  <td>4674 (36.2)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Intersex</td>
                  <td>80 (0.02)</td>
                  <td>20 (0.15)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Additional options</td>
                  <td>10,991 (2.95)</td>
                  <td>20 (0.15)</td>
                </tr>
                <tr valign="top">
                  <td colspan="4">
                    <bold>Gender, n (%)</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Female</td>
                  <td>220,833 (59.3)</td>
                  <td>8113 (62.83)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Male</td>
                  <td>138,140 (37.09)</td>
                  <td>4642 (35.95)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Nonbinary</td>
                  <td>920 (0.25)</td>
                  <td>60 (0.46)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Transgender</td>
                  <td>464 (0.12)</td>
                  <td>20 (0.15)</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Additional options</td>
                  <td>12,040 (3.23)</td>
                  <td>79 (0.61)</td>
                </tr>
                <tr valign="top">
                  <td colspan="2">
                    <bold>Age (y), median (range)</bold>
                  </td>
                  <td>56 (19-122<sup>b</sup>)</td>
                  <td>58 (19-93)</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table1fn1">
                <p><sup>a</sup>Participants who completed all questions and did not skip or choose not to answer a question.</p>
              </fn>
              <fn id="table1fn2">
                <p><sup>b</sup>Age of 122 years=a participant chose the earliest birth year (1900).</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
        </sec>
      </sec>
      <sec>
        <title>Question 2: How Do SDoH Factors Co-Occur to Form Subtypes, and What Are Their Risks for Adverse Health Outcomes?</title>
        <sec>
          <title>Overview</title>
          <p>The cohort used to identify the subtypes consisted of 12,913 participants, of whom 12,886 (99.79%) had valid IPW–generated weights. The latter cohort was split randomly into the training and replication datasets, each with complete data for 18 SDoH factors (identified in question 1) in addition to the 3 outcomes (depression, delayed medical care, and ER visits in the last year) and covariates (demographics). The results are organized based on the 3 parts of the HIT framework described in <xref rid="figure3" ref-type="fig">Figure 3</xref>.</p>
        </sec>
        <sec>
          <title>Heterogenization: Identification of Subtypes</title>
          <p>The subtypes were identified by using a bipartite network where the edges were weighted using the IPW-generated weights to account for the imbalance in demographics between our cohort and the full <italic>All of Us</italic> dataset. The weighted bipartite network of the training dataset (n=6492) and the 18 SDoH factors revealed 4 biclusters with statistically significant bicluster modularity (<italic>Q</italic>=0.13; random-<italic>Q</italic>=0.11; <italic>z</italic>=7.5; <italic>P</italic>&lt;.001). As shown in <xref rid="figure7" ref-type="fig">Figure 7</xref>, there were 4 clusters with participant subgroups and their most frequently co-occurring SDoH factors (<italic>Cluster 1 [pink]</italic>: low educational attainment, low literacy, low income, not employed, food insecurity, and housing insecurity; <italic>Cluster 2 [green]</italic>: difficulty affording medical care, discriminatory experiences in everyday life, discriminatory experiences in medical settings, and poor interactions with providers; <italic>Cluster 3 [blue]</italic>: poor neighborhood cohesion and poor relationships with others; and <italic>Cluster 4 [gray]</italic>: language barrier, lack of health care coverage, mismatched provider characteristics, disadvantaged neighborhood characteristics, disadvantaged demographics, and low supportive relationships). These co-occurrences of SDoH factors were significantly replicated in the replication dataset (real RI=0.88; random RI=0.62; <italic>P</italic>&lt;.001). As shown in <xref rid="figure8" ref-type="fig">Figure 8</xref>, while the 18 SDoH factors have a hierarchical relationship with the 5 <italic>knowledge-driven</italic> HP-30 domains (shown on the left), those same SDoH factors have a more complex relationship with the 4 <italic>data-driven</italic> biclusters (shown on the right).</p>
          <fig id="figure7" position="float">
            <label>Figure 7</label>
            <caption>
              <p>A total of 4 biclusters in the training dataset consisting of subgroups of participants (n=6492) and their most frequently co-occurring social determinant of health (SDoH) factors (d=18).</p>
            </caption>
            <graphic xlink:href="jmir_v27i1e48775_fig7.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
          <fig id="figure8" position="float">
            <label>Figure 8</label>
            <caption>
              <p>A total of 18 social determinant of health (SDoH) factors (center) have a hierarchical relationship with the 5 SDoH domains defined by Healthy People 2030 (HP-30; left), both of which are knowledge driven. In contrast, the data-driven analysis shows that SDoH factors have a complex relationship with the SDoH subtypes (right) identified through machine learning (ML), reflecting how they co-occur in the real world and aligned with models such as the Dahlgren-Whitehead model.</p>
            </caption>
            <graphic xlink:href="jmir_v27i1e48775_fig8.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Integration: Risk and Enrichment of Subtypes</title>
          <p><xref ref-type="table" rid="table2">Table 2</xref> shows the association of each subtype with the 3 outcomes. As shown by the italicized row, Cluster 1 (low educational attainment, low literacy, low income, not employed, food insecurity, and housing insecurity) had a significantly higher OR for each of the 3 outcomes than Cluster 4 (mismatched provider characteristics, disadvantaged neighborhood characteristics, lack of health care coverage, disadvantaged demographics, low supportive relationships, and language barriers). Furthermore, within the Depression outcome, each of the clusters had a significantly higher OR than one other cluster, forming a ranking of risk among all the 4 clusters (1&gt;3&gt;2&gt;4). In contrast, Delayed medical care had 2 other significant associations (2&gt;1 and 3&gt;4), with ER visits in the last year having only 1 significant pairwise association that fit into the overall trend.</p>
          <p>As shown in <xref ref-type="table" rid="table3">Table 3</xref>, this trend continued in the enrichment analysis of association with living in a state with <italic>No Medicaid expansion</italic>. As shown, Cluster 1 had a significantly higher OR than Cluster 4 in addition to having a significantly OR than the other clusters. The overall results suggest that Cluster 1 and Cluster 4 form “book ends” representing the high and low ends of the risk spectrum among the clusters.</p>
          <table-wrap position="float" id="table2">
            <label>Table 2</label>
            <caption>
              <p>Cluster comparisons to measure the risk across all 3 outcomes. Cluster 1 had a significantly higher risk than Cluster 4 for all 3 outcomes (shown in italics). The depression outcome had a distinct ranking of risks, whereas the other 2 outcomes had a subset of that ranking. All <italic>P</italic> values shown are corrected for multiple testing.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="210"/>
              <col width="180"/>
              <col width="90"/>
              <col width="180"/>
              <col width="90"/>
              <col width="160"/>
              <col width="90"/>
              <thead>
                <tr valign="top">
                  <td>Cluster comparison</td>
                  <td colspan="6">Outcomes</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td colspan="2">Depression</td>
                  <td colspan="2">Delayed medical care</td>
                  <td colspan="2">ER<sup>a</sup> visits in the last year</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>OR<sup>b</sup> (95% CI)</td>
                  <td><italic>P</italic> value</td>
                  <td>OR (95% CI)</td>
                  <td><italic>P</italic> value</td>
                  <td>OR (95% CI)</td>
                  <td><italic>P</italic> value</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>1 vs 2</td>
                  <td>1.7 (1.5-2)</td>
                  <td>&lt;.001</td>
                  <td>0.78 (0.67-0.92)</td>
                  <td>.004<sup>c</sup></td>
                  <td>1.2 (0.91-1.6)</td>
                  <td>.24</td>
                </tr>
                <tr valign="top">
                  <td>1 vs 3</td>
                  <td>1.3 (1.1-1.6)</td>
                  <td>.02<sup>d</sup></td>
                  <td>0.88 (0.72-1.1)</td>
                  <td>.23</td>
                  <td>1.4 (0.96-1.9)</td>
                  <td>.13</td>
                </tr>
                <tr valign="top">
                  <td><italic>1</italic> vs <italic>4</italic></td>
                  <td>4.2 (3.5-5.1)</td>
                  <td>&lt;.001</td>
                  <td>3.5 (3-4.1)</td>
                  <td>&lt;.001</td>
                  <td>1.8 (1.4-2.3)</td>
                  <td>&lt;.001</td>
                </tr>
                <tr valign="top">
                  <td>2 <italic>vs</italic> 3</td>
                  <td>0.79 (0.64-0.97)</td>
                  <td>.02<sup>d</sup></td>
                  <td>1.2 (0.98-1.4)</td>
                  <td>.09</td>
                  <td>1 (0.75-1.5)</td>
                  <td>.80</td>
                </tr>
                <tr valign="top">
                  <td>2 vs 4</td>
                  <td>2.3 (1.9-2.7)</td>
                  <td>&lt;.001</td>
                  <td>4.3 (3.7-5)</td>
                  <td>&lt;.001</td>
                  <td>1.3 (1-1.7)</td>
                  <td>.12</td>
                </tr>
                <tr valign="top">
                  <td>3 vs 4</td>
                  <td>2.9 (2.3-3.5)</td>
                  <td>&lt;.001</td>
                  <td>3.6 (3-4.4)</td>
                  <td>&lt;.001</td>
                  <td>1.4 (0.95-1.9)</td>
                  <td>.13</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table2fn1">
                <p><sup>a</sup>ER: emergency room.</p>
              </fn>
              <fn id="table2fn2">
                <p><sup>b</sup>OR: odds ratio.</p>
              </fn>
              <fn id="table2fn3">
                <p><sup>c</sup><italic>P</italic>&lt;.01.</p>
              </fn>
              <fn id="table2fn4">
                <p><sup>d</sup><italic>P</italic>&lt;.05.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
          <table-wrap position="float" id="table3">
            <label>Table 3</label>
            <caption>
              <p>Cluster 1 had a significantly higher odds ratio (OR) than Cluster 4 (shown in italics) for No Medicaid expansion in addition to having a higher OR than Cluster-2 and Cluster-3. All <italic>P</italic> values shown are corrected for multiple testing.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="360"/>
              <col width="410"/>
              <col width="230"/>
              <thead>
                <tr valign="top">
                  <td>Cluster comparison</td>
                  <td colspan="2">Enrichment—No Medicaid expansion</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>OR (95% CI)</td>
                  <td><italic>P</italic> value</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>1 vs 2</td>
                  <td>1.5 (1.3-1.8)</td>
                  <td>&lt;.001</td>
                </tr>
                <tr valign="top">
                  <td>1 vs 3</td>
                  <td>1.3 (1-1.6)</td>
                  <td>.048<sup>a</sup></td>
                </tr>
                <tr valign="top">
                  <td>
                    <italic>1 vs 4</italic>
                  </td>
                  <td>
                    <italic>1.3 (1.1-1.5)</italic>
                  </td>
                  <td>
                    <italic>.006</italic>
                    <sup>b</sup>
                  </td>
                </tr>
                <tr valign="top">
                  <td>2 vs 3</td>
                  <td>0.99 (0.8-1.2)</td>
                  <td>.97</td>
                </tr>
                <tr valign="top">
                  <td>2 vs 4</td>
                  <td>0.99 (0.86-1.2)</td>
                  <td>.97</td>
                </tr>
                <tr valign="top">
                  <td>3 vs 4</td>
                  <td>1 (0.82-1.2)</td>
                  <td>.97</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table3fn1">
                <p><sup>a</sup><italic>P</italic>&lt;.05.</p>
              </fn>
              <fn id="table3fn2">
                <p><sup>b</sup><italic>P</italic>&lt;.01.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
        </sec>
        <sec>
          <title>Translation: Interpretation of SDoH Subtypes and Design of Potential Interventions</title>
          <p>The expert panel examined the co-occurrences of SDoH factors within each bicluster shown in the network visualization (<xref rid="figure7" ref-type="fig">Figure 7</xref>) and integrated them with the quantitative ORs in <xref ref-type="table" rid="table2">Tables 2</xref> and <xref ref-type="table" rid="table3">3</xref>. The consistent “book ends” result where Cluster 1 had significantly higher ORs than Cluster 4 across all 4 variables was of strong interest and interpreted as follows: (1) Cluster 1 was labeled <italic>Socioeconomic barriers</italic> as it comprised multiple high-risk SDoH. These co-occurring SDoH could have resulted from cascades over time, such as low educational attainment, potentially leading to lower rates of employment and lower income with higher rates of food and housing insecurity. Such cascading factors can be perceived as being relatively unmodifiable, leading to a higher risk of chronic stress and depression. Furthermore, the strong association of this subtype with the outcomes <italic>Delayed medical care</italic> and <italic>ER visits in the last tear</italic> and the fact that participants in this subtype were more likely to be from a US state with <italic>No Medicaid expansion</italic> provided a more comprehensive understanding of this high-risk SDoH subtype; (2) Cluster 4 was labeled <italic>Sociocultural barriers</italic> as it contained a combination of SDoH related to disadvantaged neighborhood characteristics and low supportive relations in addition to language barriers and mismatched provider interactions. In contrast to the socioeconomic barriers in Cluster 1, many of the sociocultural barriers could be perceived as potentially modifiable, resulting in a lower risk of depression, delayed medical care, and ER visits. Participants who matched this profile could be screened for language and communication barriers, useful for providing culturally competent care, identifying providers who better match the profile of the individuals, and providing resources to facilitate contact with matching nationality or cultural groups in the vicinity or on the web.</p>
          <p>While Clusters 1 and 4 formed the “book ends” of risk across the 3 outcomes, potentially caused by relative differences in the unmodifiability of their frequently co-occurring SDoH, Cluster 2 was flagged as critical and labeled <italic>Lived experience barriers</italic>. The SDoH in this cluster included discriminatory experiences in everyday life and in medical settings in addition to poor interactions with providers and difficulty affording medical care. These frequently co-occurring SDoH could explain why this subtype had a significantly higher OR for <italic>Delayed medical care</italic> than Cluster 1. Finally, Cluster 3 was labeled <italic>Social context barriers</italic> as the SDoH were related to poor neighborhood cohesion and relationships with others. While not as critical as Clusters 1 and 2, this cluster still had a significantly higher OR for Depression than Cluster 4. Together, the 4 clusters could explain how different degrees of unmodifiability in frequently co-occurring SDoH might impact health outcomes.</p>
          <p>The expert panel and the ethicist concluded that clinicians treating patients who match each subtype profile could be alerted of specific risks and, consequently, motivate a discussion about mental health and consequences of delayed medical care with the goal of collaboratively exploring options and solutions with the patients. The results could also be useful for resource planning in hospitals to ensure that there is adequate staff to address the needs of the populations they serve, and for proposing health care policies to address the critical connection between specific combinations of SDoH and their impact on public health. For example, many health equity policies categorize Americans based on sociodemographic variables like race and income, which are proxies of need rather than the needs themselves. Instead, such policies could categorize Americans based on SDoH subtypes and their risks to more precisely allocate resources based on combinations of real-world needs.</p>
          <p>Furthermore, the subtypes did not have a one-to-one mapping to the 5 SDoH domains defined by HP-30. As shown in <xref rid="figure8" ref-type="fig">Figure 8</xref>, these data-driven clusters have a complex relationship with the SDoH domains and factors. While one subtype belonged to a single domain (the <italic>Social context</italic> subtype belonged to the <italic>Social and community context</italic> domain), 3 of the 4 subtypes belonged to ≥2 domains (eg, the <italic>Socioeconomic barriers</italic> subtype belonged to the <italic>Economic stability</italic> and <italic>Education access and quality</italic> domains). Such interdomain relationships reflect how SDoH co-occur in the real world, reflecting the complex cross-domain interactions described in the Dahlgren-Whitehead model (<xref rid="figure1" ref-type="fig">Figure 1</xref>). These relationships could be useful for refining conceptual models to explain the complex association between SDoH and adverse health outcomes and build more accurate SDoH models for predicting adverse health outcomes.</p>
        </sec>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>The mechanisms through which SDoH precipitate adverse health outcomes are complex, consisting of many interacting factors and feedback loops among individual and environmental and contextual factors. While this phenomenon has been studied for &gt;3 decades, critical hurdles for researchers have included the <italic>limited range</italic> of datatypes, <italic>limited representation</italic> of populations that have been socially marginalized, and <italic>limited access</italic> to individual-level data at scale due to privacy laws. Recognizing that <italic>All of Us</italic> has well-articulated plans and resources to overcome these limitations but is still in a rapidly evolving stage, we conducted a systematic characterization of &gt;100 SDoH survey questions available in <italic>All of Us</italic> and used them to identify SDoH subtypes with the future goal of designing targeted interventions.</p>
        <p>For question 1, we identified 110 SDoH questions across 4 surveys, which covered all 5 domains in HP-30. However, the results also revealed a large degree of missingness in survey responses (1.76%-84.56%), with later surveys having significantly fewer responses than earlier ones, and significant differences in race, ethnicity, and age of participants among those who completed the surveys with SDoH questions compared to those in the full <italic>All of Us</italic> dataset. Furthermore, as the SDoH questions varied in granularity, they were categorized by an expert panel into 18 SDoH factors. For question 2, the subtype analysis identified 4 biclusters with significant biclusteredness and significant replication. Furthermore, there were statistically significant associations between specific subtypes and the outcomes, as well as with Medicaid expansion, each with meaningful interpretations and potential targeted interventions. Finally, the identified subtypes spanned one or more HP-30 domains, revealing the difference between the current knowledge-based SDoH domains and the data-driven subtypes.</p>
        <p>While the results revealed the nature of and responses to SDoH questions in <italic>All of Us</italic> and significant and interpretable SDoH subtypes, the analysis revealed critical opportunities and challenges related to data, methods, and theory. Such insights are useful for future researchers conducting similar analyses on <italic>All of Us</italic> and, therefore, are discussed in the following sections.</p>
      </sec>
      <sec>
        <title>Data: Missingness and Granularity</title>
        <sec>
          <title>Missingness</title>
          <p>The analysis revealed 3 types of missingness. The first was <italic>rollout missingness</italic>. This type of missingness was largely dictated by how the surveys were rolled out to participants. As all participants at enrollment are required to do <italic>The Basics</italic> and <italic>Overall Health</italic> surveys, these surveys had the highest number of responses, followed by the later solicited <italic>Healthcare Access and Utilization</italic> and <italic>SDoH</italic> surveys rolled out more recently in 2022. This order of rollout was the main source of missingness, resulting in a precipitous reduction in cohort size for those who had answers to all the SDoH questions. The second type was <italic>valid answer missingness</italic>. As participants can choose not to answer any survey questions, the data contained “skip” and “choose not to answer” responses. However, these responses accounted for a much smaller reduction in cohort size for complete data than rollout missingness. The third type was <italic>low use missingness</italic>. Although there were 259 SDoH SNOMED codes, only 93 (35.9%) had such information for &gt;20 participants that are allowed to be reported. This could be because most clinicians currently do not screen for SDoH as it is typically done by a social worker. Furthermore, we also attempted to use 3-digit zip codes to determine which subtypes had a significant association with living in a state that did not offer Medicaid expansion. However, 13.07% (1688/12,913) of the participants did not have zip code information (which was adjusted by using IPW).</p>
          <p>Together, the aforementioned 3 types of missingness impacted the size of the resulting cohort that had valid answers in the following 2 ways, which is the minimum number of participants that are allowed to be reported by <italic>All of Us</italic>. First, there was a drastic reduction in cohort size by 93.5%. However, because of the size of the overall dataset (N=372,397), we were still left with a large cohort (n=12,886), which, to the best of our knowledge, is the largest set of individuals to be analyzed for such a wide range of SDoH. Second, there were significant differences in the proportion of race, ethnicity, and age in the aforementioned cohort when compared to the overall <italic>All of Us</italic> population. Specifically, the cohort with valid answers had significantly more White, non-Hispanic, or older participants when compared to the overall cohort. This could potentially be because, once a participant has been enrolled, there is a 90-day delay in sending subsequent solicitations to complete surveys, a policy that is currently being reassessed due to its impact on missingness. Therefore, we had to correct this imbalance in demographic proportions by using IPW with the goal of identifying subtypes that were representative of the overall <italic>All of Us</italic> cohort.</p>
        </sec>
        <sec>
          <title>Granularity</title>
          <p>Because our goal was to use machine learning methods to identify SDoH subtypes, we encountered uneven granularity in the SDoH questions. Some questions were fine grained and highly correlated and, therefore, would cluster more strongly because of the nature of the granularity of the questions, not because of the SDoH mechanisms. To address this uneven granularity and make the results more interpretable, we used SDoH factors that had a coarser but more consistent level of granularity. We chose this approach because SDoH factors had already been defined; were understood by the expert panel, enabling high domain fidelity; and appeared to be at the right level of abstraction useful for clinical applications, such as referring a patient to the appropriate social services. However, because the use of coarse-grained variables loses information, future research could explore aggregating only those SDoH questions that are highly correlated while preserving the rest at the finer level of granularity and explore computational methods to merge SDoH questions into SDoH factors.</p>
        </sec>
      </sec>
      <sec>
        <title>Method: Scalability, Generalizability, and Extensibility</title>
        <p>We designed the HIT analytical framework to be scalable, enabling its use for the growing size of the data in <italic>All of Us</italic>; generalizable across cohorts and conditions; and extensible for including additional methods as needed in the future. Testing the HIT framework on the <italic>All of Us</italic> dataset provided insights into the strengths and limitations of the framework and the <italic>All of Us</italic> workbench where the analysis was conducted.</p>
        <sec>
          <title>Scalability</title>
          <p>We used 3 types of code to conduct the analysis for both research questions. The first was automatically generated code to extract the cohort, produced by <italic>All of Us</italic> once a cohort was selected using the point-and-click interface. This code was adequately scalable and generalizable and so will not be discussed further. The second was customized code to extract specific parts of the data. For example, the analysis of co-occurrences required customized code in R (R Foundation for Statistical Computing) to plot the diagrams in <xref rid="figure4" ref-type="fig">Figures 4</xref>–6. As expected, these tasks required strong programming skills, but fortunately, we did not encounter any coding or execution problems using the R or Python (Python Software Foundation) programming languages. However, there were significant server issues that hampered our analysis. Although the workbench instructions stated that code running on the workbench for &gt;2 weeks would be terminated and all intermediate results would be deleted, we frequently encountered our work disappearing at shorter intervals. These disruptions resulted in a higher consumption of the free server time credits resulting in fewer analyses that could be conducted. The third type of code was machine learning code that we had previously developed and disseminated on Comprehensive R Archive Network [<xref ref-type="bibr" rid="ref78">78</xref>-<xref ref-type="bibr" rid="ref80">80</xref>] to conduct the bipartite network analysis and the significance testing and visualize the network. As this code was designed to be generalizable and scalable, we did not encounter any issues in the execution of our code (in addition to the same server issues mentioned previously). Finally, the visualization of our networks worked as expected, and we used them to help interpret the patterns in the data.</p>
        </sec>
        <sec>
          <title>Generalizability</title>
          <p>Our code for the first 2 steps of the HIT framework is in Project Jupyter notebooks and has been used to analyze other cohorts that were filtered for age and previous conditions. For example, we extracted a cohort (n=4090) of participants with diabetes aged ≥65 years with complete data on 18 SDoH variables selected through consensus by 2 experienced health services researchers and guided by the Andersen behavioral model. The analysis [<xref ref-type="bibr" rid="ref81">81</xref>,<xref ref-type="bibr" rid="ref82">82</xref>] revealed 7 SDoH subtypes with statistically significant modularity compared with 100 random permutations of the data (<italic>All of Us</italic>=0.51; random mean 0.38 SD 0.0065; <italic>z</italic>=20; <italic>P</italic>&lt;.001) and that were not only clinically meaningful but also significant in different degrees for the outcome. Our subsequent attempt at increasing the number of SDoH variables from 18 to 110 for participants with diabetes who had valid answers led to an extremely small cohort size (n=926; <xref ref-type="supplementary-material" rid="app5">Multimedia Appendix 5</xref>) due to the missingness that we described previously. While this reduction resulted in our current strategy of analyzing all participants regardless of condition or age, these experiments demonstrate that our approach is generalizable to other subsets of the data.</p>
        </sec>
        <sec>
          <title>Extensibility</title>
          <p>The HIT model is designed to be extensible to include other methods. For example, the model could use other biclustering (eg, nonnegative matrix factorization [<xref ref-type="bibr" rid="ref83">83</xref>]) and causal modeling methods and different types of classification (eg, deep learning [<xref ref-type="bibr" rid="ref84">84</xref>]) and prediction methods (eg, subgroup-specific modeling [<xref ref-type="bibr" rid="ref40">40</xref>]) to build the decision support system in the translational step (<xref rid="figure2" ref-type="fig">Figure 2</xref>). Furthermore, the model can integrate a wide range of datatypes to enable analysis of how each subtype is associated with them, resulting in a layered interpretation of the SDoH subtypes, as we have demonstrated. For example, as the percentage of participants who have genomic information increases (currently, &gt;25% of our cohort have missing genomic information), our pipeline will be able to integrate such information into our analysis. Finally, the integration of different datatypes required a diverse team consisting of experts in machine learning, biostatistics, programming, clinical care, health services research, gerontology, and ethics to enable a 360° analysis and interpretation of the subtypes that was, therefore, aligned with the human-centered artificial intelligence approach [<xref ref-type="bibr" rid="ref64">64</xref>-<xref ref-type="bibr" rid="ref66">66</xref>]. Furthermore, the use of the workbench to share results through visualizations operationalized <italic>team-centered informatics</italic> [<xref ref-type="bibr" rid="ref85">85</xref>] designed to facilitate multidisciplinary translational teams [<xref ref-type="bibr" rid="ref86">86</xref>] working more effectively across disciplinary boundaries with the goal of analyzing subtypes and designing targeted interventions.</p>
        </sec>
      </sec>
      <sec>
        <title>Theory: Model Building and Translational Implications</title>
        <p>The identification of SDoH subtypes has strong implications for model building in addition to translational applications. As shown in <xref rid="figure8" ref-type="fig">Figure 8</xref>, while the current classification of 5 SDoH domains has a hierarchical relationship with the SDoH factors, the data-driven clusters have a more complex association with the same SDoH factors. This reflects the complexity of how SDoH occur in the real world while at the same time being interpretable for purposes of translation.</p>
        <p>Future studies should develop prediction models using the data-driven subtypes to determine whether they improve the accuracy of predicting adverse health outcomes when compared to models that do not use those subtypes. Because the subtypes were clinically interpretable, they could be used to build classification and prediction models and used with an interface to develop a clinical decision support system that helps triage patients to critical services. For example, the St Vincent’s House [<xref ref-type="bibr" rid="ref87">87</xref>] in Galveston, Texas, United States, provides several services to address SDoH, including free walk-in clinical care, nurse practitioners with reduced insurance co-payments, English- and Spanish-speaking free mental health counseling, free dental health clinic, utility and rental assistance, case management, financial literacy, expanded food pantry, weekly free home delivery of pantry groceries, snack pack for people experiencing homelessness, free transportation to clinician’s appointments, immigration legal services, and spiritual counseling. Given the availability of this wide range of services in many communities across the United States, a decision support system could help classify an individual based on their SDoH profile into one or more of the subtypes and measure their risk of an adverse health outcome. Such information could be used by clinicians to collaboratively explore solutions with the patient to consider one or more of such local services based on the membership strength to a subtype and the associated risk (<xref rid="figure2" ref-type="fig">Figure 2</xref>, step 3). At a population level, understanding health risks associated with clusters may assist institutions and organizations in developing more effective prevention programs.</p>
      </sec>
      <sec>
        <title>Notebooks for <italic>All of Us</italic> Community Use</title>
        <p>Because the missingness in SDoH variables is expected to decrease, their characterization and subtyping will need to be repeated and verified for different cohorts. Therefore, we have made the following 2 sets of code available for general use by the <italic>All of Us</italic> researcher community (accessible after creating a free account on <italic>All of Us</italic> and completing the required training).</p>
        <sec>
          <title>SDoH Valid Answer Tracker</title>
          <p>This set of notebooks generates four plots that can be used by other researchers on <italic>All of Us</italic> to characterize any cohort: (1) valid response plot to show how many participants have data with valid responses and colored by SDoH domain, (2) Venn diagram showing how many participants have valid responses for all questions within each survey, and (3) frequency distribution plot showing co-occurrence of SDoH across the selected cohort. This set of tools should enable researchers to characterize SDoH across different cohorts to help determine methods that are appropriate to adjust for missingness in those cohorts.</p>
        </sec>
        <sec>
          <title>SDoH Subtyper</title>
          <p>This set of notebooks can be used to conduct the following analyses: (1) bicluster modularity of a cohort with the 18 SDoH factors to identify the number and members of biclusters and the measure <italic>Q</italic> representing the quality of the biclustering, (2) visualization of the bipartite network, and (3) significance of the network with respect to null models.</p>
        </sec>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>This study has 2 main limitations. The first emerges from the large amount of missingness in the survey data, precluding the use of imputation methods that assume a random distribution of missingness. Therefore, we could use only complete data, which led to a large drop in cohort size and which also introduced a bias in the demographics requiring a rebalancing through IPW. While such rebalancing is typically done for large datasets, the IPW method requires judgment to decide which variables to include in the model and, therefore, could have introduced additional unknown biases. Therefore, the model should be refined to determine which variables to include in the regression models that estimate the IPW-generated weights. However, because the clustering was similar between the unweighted and IPW-weighted networks, we believe that the current subtypes are stable and meaningful and represent the demographic composition of the full <italic>All of Us</italic> dataset, but this needs to be verified by redoing the analysis as the data become more complete. The limitation of missingness in the surveys is expected to be addressed as <italic>All of Us</italic> has recently removed the requirement of waiting 90 days before a subsequent survey is given to an enrollee in the program, potentially reducing the degree of missingness. The second limitation is due to the high computational cost of empirically determining the significance of the biclustering. As such analysis is computationally expensive and time-consuming, it limited the experiments we could do to test different cohorts and models. Therefore, we look forward to the <italic>All of Us</italic> workbench providing the ability to run batch processes more efficiently and uninterruptedly for extended periods (exceeding the current time window), which together could help alleviate this computational hurdle in the future.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>How SDoH impact health is a complex phenomenon involving many interconnected social, biological, and environmental factors that have yet to be fully elucidated. While this phenomenon has been studied for &gt;30 years, the analyses have been hampered by the lack of large cohorts representing diverse populations with a wide range of SDoH variables measured, multiple datatypes, and easy access by researchers. <italic>All of Us</italic> provides an unprecedented opportunity to directly address these limitations with the goal of doing justice to early conceptual models such as the social gradient and the Dahlgren-Whitehead model, both of which drew international attention to the complex ways in which individual and contextual SDoH factors impact health. The <italic>All of Us</italic> dataset is also timely because of the extensive health disparities that were revealed during the pandemic, which highlighted the critical need to address SDoH in the public and policy realms. However, because <italic>All of Us</italic> is still rapidly evolving to meet its target of 1 million participants or more, we conducted a systematic characterization of SDoH variables in <italic>All of Us</italic> and used the results to guide the analysis of SDoH subtypes. The identified subtypes, along with their risks, could be used to design data-informed interventions, resource-planning strategies, and public health policies aimed at reducing the risks of adverse health outcomes. However, careful consideration would be required to ensure that the identification of high-risk subtypes is not used in a way that stigmatizes subpopulations.</p>
        <p>Our first goal of characterizing the data revealed the nature of the missingness in SDoH and the uneven granularity in the SDoH questions. Both of these results led us to select the IPW method to address the missingness and to analyze subtypes using SDoH factors to address the uneven granularity. Our second goal of identifying SDoH subtypes led not only to statistically significant biclusteredness but also to their statistically significant replication and meaningful domain interpretations. These results set the stage for further investigations to build and evaluate classification and prediction models for designing decision support systems that alert clinicians of specific risks that their patients face due to a combination of SDoH factors. Furthermore, the SDoH subtypes could be used to design public health care policies that are multifactorial and need based, enabling more targeted interventions compared to policies that are based on a few sociodemographic factors such as race and income.</p>
        <p>The results also led to the design, use, and dissemination of general-purpose tools currently available on <italic>All of Us</italic> for other researchers, which will be useful to reanalyze the <italic>All of Us</italic> dataset as it grows over the next few years to directly address the high rate of missingness. These collaborative advances should position <italic>All of Us</italic> to revolutionize research for analyzing complex phenomena such as how SDoH impact health and beyond, with the goal of enabling a more equitable future that all of us deserve.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Description of bipartite network analysis.</p>
        <media xlink:href="jmir_v27i1e48775_app1.docx" xlink:title="DOCX File , 617 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Systematized Medical Nomenclature of Medicine codes related to social determinants of health and their use in the electronic health records of participants in All of Us.</p>
        <media xlink:href="jmir_v27i1e48775_app2.docx" xlink:title="DOCX File , 184 KB"/>
      </supplementary-material>
      <supplementary-material id="app3">
        <label>Multimedia Appendix 3</label>
        <p>Data conversion. A total of 4 <italic>All of Us</italic> surveys (column 2) contained 110 social determinants of health questions (column 3), which were abbreviated, negatively phrased (shown bolded), and reversed coded (shown in red; column 3); categorized into the 5 Healthy People 2030 domains (column 4 and shown by the 5 colors); and further categorized (boxes) by the expert panel into 18 factors (column 5; Delayed medical care was used as an outcome).</p>
        <media xlink:href="jmir_v27i1e48775_app3.docx" xlink:title="DOCX File , 40 KB"/>
      </supplementary-material>
      <supplementary-material id="app4">
        <label>Multimedia Appendix 4</label>
        <p>Inverse probability weighting.</p>
        <media xlink:href="jmir_v27i1e48775_app4.docx" xlink:title="DOCX File , 99 KB"/>
      </supplementary-material>
      <supplementary-material id="app5">
        <label>Multimedia Appendix 5</label>
        <p>Condition-specific cohort extraction for type 2 diabetes, breast cancer, and coronary artery disease, and inclusion and exclusion criteria for selecting 3 condition-specific cohorts.</p>
        <media xlink:href="jmir_v27i1e48775_app5.docx" xlink:title="DOCX File , 66 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">EHR</term>
          <def>
            <p>electronic health record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">ER</term>
          <def>
            <p>emergency room</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">HIT</term>
          <def>
            <p>heterogenization, integration, and translation</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">HP-30</term>
          <def>
            <p>Healthy People 2030</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">IPW</term>
          <def>
            <p>inverse probability weighting</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">OR</term>
          <def>
            <p>odds ratio</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">RI</term>
          <def>
            <p>Rand index</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">SDoH</term>
          <def>
            <p>social determinants of health</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">SNOMED</term>
          <def>
            <p>Systematized Medical Nomenclature of Medicine</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>The authors thank Gautam Vallabha, PhD, for his assistance in refining the analysis and the manuscript. This study was supported in part by the Artificial Intelligence and Machine Learning Consortium to Advance Health Equity and Researcher Diversity (1OT2SD03258102293), the Clinical and Translational Science Award (UL1 TR001439) from the National Center for Advancing Translational Sciences at the National Institutes of Health, the University of Texas Medical Branch Claude D. Pepper Older Americans Independence Center funded by the National Institute on Aging at the National Institutes of Health (P30AG024832), the MD Anderson Cancer Center, the National Library of Medicine (R01 LM012095) at the National Institutes of Health, and the National Institute on Aging (K01AG058789, K01AG065492), Agency for Healthcare Research and Quality (R01-HS029891). The content is solely the responsibility of the authors and does not necessarily represent the official views of the National Institutes of Health. No part of this manuscript was generated using large language models.</p>
    </ack>
    <notes>
      <sec>
        <title>Data Availability</title>
        <p>The datasets analyzed in this study are publicly available from the <italic>All of Us</italic> program after registering for access [<xref ref-type="bibr" rid="ref88">88</xref>].</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="con">
        <p>SKB and BD conceived the overall design of the analysis and wrote the manuscript. WZ, DB, and AB wrote the analytical code to analyze the data. BD designed the method for handling the missing data, identified sources for social determinants of health (SDoH), and guided the overall design of the analysis. SV identified frameworks for SDoH and guided the overall design of the analysis. YFK provided statistical guidance for the analysis. BD, SS, and TR guided the identification and granularization of the SDoH questions from the <italic>All of Us</italic> surveys. SS, MRP, TR, BD, and MR interpreted the subtypes and inferred the mechanisms and potential interventions, and VA and RH refined those interpretations. ES provided guidance on the ethical aspects of the analysis and interpretation. SV and BD had equal contribution for guiding the overall project. All authors reviewed the final manuscript.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Weida</surname>
              <given-names>EB</given-names>
            </name>
            <name name-style="western">
              <surname>Phojanakong</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Chilton</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Financial health as a measurable social determinant of health</article-title>
          <source>PLoS One</source>
          <year>2020</year>
          <volume>15</volume>
          <issue>5</issue>
          <fpage>e0233359</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0233359"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0233359</pub-id>
          <pub-id pub-id-type="medline">32421755</pub-id>
          <pub-id pub-id-type="pii">PONE-D-19-31725</pub-id>
          <pub-id pub-id-type="pmcid">PMC7233592</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kushel</surname>
              <given-names>MB</given-names>
            </name>
            <name name-style="western">
              <surname>Gupta</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Gee</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Haas</surname>
              <given-names>JS</given-names>
            </name>
          </person-group>
          <article-title>Housing instability and food insecurity as barriers to health care among low-income Americans</article-title>
          <source>J Gen Intern Med</source>
          <year>2006</year>
          <month>01</month>
          <volume>21</volume>
          <issue>1</issue>
          <fpage>71</fpage>
          <lpage>7</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/16423128"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/j.1525-1497.2005.00278.x</pub-id>
          <pub-id pub-id-type="medline">16423128</pub-id>
          <pub-id pub-id-type="pii">JGI278</pub-id>
          <pub-id pub-id-type="pmcid">PMC1484604</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="web">
          <article-title>Social determinants of health</article-title>
          <source>World Health Organization</source>
          <access-date>2024-07-07</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.who.int/health-topics/social-determinants-of-health#tab=tab_1">https://www.who.int/health-topics/social-determinants-of-health#tab=tab_1</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dahlgren</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Whitehead</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>The Dahlgren-Whitehead model of health determinants: 30 years on and still chasing rainbows</article-title>
          <source>Public Health</source>
          <year>2021</year>
          <month>10</month>
          <volume>199</volume>
          <fpage>20</fpage>
          <lpage>4</lpage>
          <pub-id pub-id-type="doi">10.1016/j.puhe.2021.08.009</pub-id>
          <pub-id pub-id-type="medline">34534885</pub-id>
          <pub-id pub-id-type="pii">S0033-3506(21)00336-X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cook</surname>
              <given-names>WK</given-names>
            </name>
          </person-group>
          <article-title>Paid sick days and health care use: an analysis of the 2007 national health interview survey data</article-title>
          <source>Am J Ind Med</source>
          <year>2011</year>
          <month>10</month>
          <volume>54</volume>
          <issue>10</issue>
          <fpage>771</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/21761429"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/ajim.20988</pub-id>
          <pub-id pub-id-type="medline">21761429</pub-id>
          <pub-id pub-id-type="pmcid">PMC3168716</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kaplan</surname>
              <given-names>GA</given-names>
            </name>
            <name name-style="western">
              <surname>Keil</surname>
              <given-names>JE</given-names>
            </name>
          </person-group>
          <article-title>Socioeconomic factors and cardiovascular disease: a review of the literature</article-title>
          <source>Circulation</source>
          <year>1993</year>
          <month>10</month>
          <volume>88</volume>
          <issue>4 Pt 1</issue>
          <fpage>1973</fpage>
          <lpage>98</lpage>
          <pub-id pub-id-type="doi">10.1161/01.cir.88.4.1973</pub-id>
          <pub-id pub-id-type="medline">8403348</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="web">
          <article-title>Mapping key determinants of immigrants' health in Brooklyn and Queens</article-title>
          <source>Center for Migration Studies of New York (CMS)</source>
          <year>2021</year>
          <access-date>2024-07-07</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cmsny.org/wp-content/uploads/2021/02/Mapping-Key-Health-Determinants-for-Immigrants-Report-Center-for-Migration-Studies.pdf">https://cmsny.org/wp-content/uploads/2021/02/Mapping-Key-Health-Determinants-for-Immigrants-Report-Center-for-Migration-Studies.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="web">
          <article-title>Social Determinants of Health (SDOH)</article-title>
          <source>NEJM Catalyst</source>
          <year>2017</year>
          <month>12</month>
          <day>1</day>
          <access-date>2023-06-28</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://catalyst.nejm.org/doi/full/10.1056/CAT.17.0312">https://catalyst.nejm.org/doi/full/10.1056/CAT.17.0312</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ramirez</surname>
              <given-names>AH</given-names>
            </name>
            <name name-style="western">
              <surname>Gebo</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Harris</surname>
              <given-names>PA</given-names>
            </name>
          </person-group>
          <article-title>Progress with the all of us research program: opening access for researchers</article-title>
          <source>JAMA</source>
          <year>2021</year>
          <month>06</month>
          <day>22</day>
          <volume>325</volume>
          <issue>24</issue>
          <fpage>2441</fpage>
          <lpage>2</lpage>
          <pub-id pub-id-type="doi">10.1001/jama.2021.7702</pub-id>
          <pub-id pub-id-type="medline">34115137</pub-id>
          <pub-id pub-id-type="pii">2781166</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <collab>All of Us Research Program Investigators</collab>
            <name name-style="western">
              <surname>Denny</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Rutter</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Goldstein</surname>
              <given-names>DB</given-names>
            </name>
            <name name-style="western">
              <surname>Philippakis</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Smoller</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Jenkins</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Dishman</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>The "All of Us" research program</article-title>
          <source>N Engl J Med</source>
          <year>2019</year>
          <month>08</month>
          <day>15</day>
          <volume>381</volume>
          <issue>7</issue>
          <fpage>668</fpage>
          <lpage>76</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31412182"/>
          </comment>
          <pub-id pub-id-type="doi">10.1056/NEJMsr1809937</pub-id>
          <pub-id pub-id-type="medline">31412182</pub-id>
          <pub-id pub-id-type="pmcid">PMC8291101</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ramirez</surname>
              <given-names>AH</given-names>
            </name>
            <name name-style="western">
              <surname>Sulieman</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Schlueter</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Halvorson</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Qian</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ratsimbazafy</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Loperena</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Mayo</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Basford</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Deflaux</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Muthuraman</surname>
              <given-names>KN</given-names>
            </name>
            <name name-style="western">
              <surname>Natarajan</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kho</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wilkins</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Anton-Culver</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Boerwinkle</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Cicek</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Clark</surname>
              <given-names>CR</given-names>
            </name>
            <name name-style="western">
              <surname>Cohn</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Ohno-Machado</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Schully</surname>
              <given-names>SD</given-names>
            </name>
            <name name-style="western">
              <surname>Ahmedani</surname>
              <given-names>BK</given-names>
            </name>
            <name name-style="western">
              <surname>Argos</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cronin</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>O'Donnell</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Fouad</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Goldstein</surname>
              <given-names>DB</given-names>
            </name>
            <name name-style="western">
              <surname>Greenland</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Hebbring</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Karlson</surname>
              <given-names>EW</given-names>
            </name>
            <name name-style="western">
              <surname>Khatri</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Korf</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Smoller</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Sodeke</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wilbanks</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hentges</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Mockrin</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lunt</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Devaney</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Gebo</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Denny</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Carroll</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Glazer</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Harris</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Hripcsak</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Philippakis</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Roden</surname>
              <given-names>DM</given-names>
            </name>
          </person-group>
          <article-title>The All of Us Research Program: data quality, utility, and diversity</article-title>
          <source>Patterns (N Y)</source>
          <year>2022</year>
          <month>08</month>
          <day>12</day>
          <volume>3</volume>
          <issue>8</issue>
          <fpage>100570</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2666-3899(22)00181-7"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.patter.2022.100570</pub-id>
          <pub-id pub-id-type="medline">36033590</pub-id>
          <pub-id pub-id-type="pii">S2666-3899(22)00181-7</pub-id>
          <pub-id pub-id-type="pmcid">PMC9403360</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Marmot</surname>
              <given-names>MG</given-names>
            </name>
          </person-group>
          <article-title>Status syndrome: a challenge to medicine</article-title>
          <source>JAMA</source>
          <year>2006</year>
          <month>03</month>
          <day>15</day>
          <volume>295</volume>
          <issue>11</issue>
          <fpage>1304</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.1001/jama.295.11.1304</pub-id>
          <pub-id pub-id-type="medline">16537740</pub-id>
          <pub-id pub-id-type="pii">295/11/1304</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Adler</surname>
              <given-names>NE</given-names>
            </name>
            <name name-style="western">
              <surname>Ostrove</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>Socioeconomic status and health: what we know and what we don't</article-title>
          <source>Ann N Y Acad Sci</source>
          <year>1999</year>
          <volume>896</volume>
          <fpage>3</fpage>
          <lpage>15</lpage>
          <pub-id pub-id-type="doi">10.1111/j.1749-6632.1999.tb08101.x</pub-id>
          <pub-id pub-id-type="medline">10681884</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mackenbach</surname>
              <given-names>JP</given-names>
            </name>
            <name name-style="western">
              <surname>Bos</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Andersen</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Cardano</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Costa</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Harding</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Reid</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hemström</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Valkonen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Kunst</surname>
              <given-names>AE</given-names>
            </name>
          </person-group>
          <article-title>Widening socioeconomic inequalities in mortality in six Western European countries</article-title>
          <source>Int J Epidemiol</source>
          <year>2003</year>
          <month>10</month>
          <volume>32</volume>
          <issue>5</issue>
          <fpage>830</fpage>
          <lpage>7</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://core.ac.uk/reader/18602492?utm_source=linkout"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/ije/dyg209</pub-id>
          <pub-id pub-id-type="medline">14559760</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>McDonough</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Duncan</surname>
              <given-names>GJ</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>House</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Income dynamics and adult mortality in the United States, 1972 through 1989</article-title>
          <source>Am J Public Health</source>
          <year>1997</year>
          <month>09</month>
          <volume>87</volume>
          <issue>9</issue>
          <fpage>1476</fpage>
          <lpage>83</lpage>
          <pub-id pub-id-type="doi">10.2105/ajph.87.9.1476</pub-id>
          <pub-id pub-id-type="medline">9314800</pub-id>
          <pub-id pub-id-type="pmcid">PMC1380973</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dahlgren</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Whitehead</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Policies and strategies to promote social equity in health. Background document to WHO - Strategy paper for Europe</article-title>
          <source>Institutet för Framtidsstudier</source>
          <year>1991</year>
          <access-date>2024-05-27</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.researchgate.net/publication/5095964_Policies_and_strategies_to_promote_social_equity_in_health_Background_document_to_WHO_-_Strategy_paper_for_Europe">https://www.researchgate.net/publication/5095964_Policies_and_strategies_to_promote_social_equity_in_health_Background_document_to_WHO_-_Strategy_paper_for_Europe</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lucyk</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>McLaren</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Taking stock of the social determinants of health: a scoping review</article-title>
          <source>PLoS One</source>
          <year>2017</year>
          <volume>12</volume>
          <issue>5</issue>
          <fpage>e0177306</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0177306"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0177306</pub-id>
          <pub-id pub-id-type="medline">28493934</pub-id>
          <pub-id pub-id-type="pii">PONE-D-16-41569</pub-id>
          <pub-id pub-id-type="pmcid">PMC5426664</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Muller</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Education, income inequality, and mortality: a multiple regression analysis</article-title>
          <source>BMJ</source>
          <year>2002</year>
          <month>01</month>
          <day>05</day>
          <volume>324</volume>
          <issue>7328</issue>
          <fpage>23</fpage>
          <lpage>5</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/11777800"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmj.324.7328.23</pub-id>
          <pub-id pub-id-type="medline">11777800</pub-id>
          <pub-id pub-id-type="pmcid">PMC61654</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hill-Briggs</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Adler</surname>
              <given-names>NE</given-names>
            </name>
            <name name-style="western">
              <surname>Berkowitz</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Chin</surname>
              <given-names>MH</given-names>
            </name>
            <name name-style="western">
              <surname>Gary-Webb</surname>
              <given-names>TL</given-names>
            </name>
            <name name-style="western">
              <surname>Navas-Acien</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Thornton</surname>
              <given-names>PL</given-names>
            </name>
            <name name-style="western">
              <surname>Haire-Joshu</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Social determinants of health and diabetes: a scientific review</article-title>
          <source>Diabetes Care</source>
          <year>2020</year>
          <month>11</month>
          <day>02</day>
          <volume>44</volume>
          <issue>1</issue>
          <fpage>258</fpage>
          <lpage>79</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33139407"/>
          </comment>
          <pub-id pub-id-type="doi">10.2337/dci20-0053</pub-id>
          <pub-id pub-id-type="medline">33139407</pub-id>
          <pub-id pub-id-type="pii">dci20-0053</pub-id>
          <pub-id pub-id-type="pmcid">PMC7783927</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="web">
          <article-title>PhenX Social Determinants of Health (SDOH) assessments collection</article-title>
          <source>National Institutes of Health National Institute on Minority Health and Health Disparities</source>
          <access-date>2024-01-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.nimhd.nih.gov/resources/phenx/">https://www.nimhd.nih.gov/resources/phenx/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hamilton</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Strader</surname>
              <given-names>LC</given-names>
            </name>
            <name name-style="western">
              <surname>Pratt</surname>
              <given-names>JG</given-names>
            </name>
            <name name-style="western">
              <surname>Maiese</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Hendershot</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Kwok</surname>
              <given-names>RK</given-names>
            </name>
            <name name-style="western">
              <surname>Hammond</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Huggins</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Jackman</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Pan</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Nettles</surname>
              <given-names>DS</given-names>
            </name>
            <name name-style="western">
              <surname>Beaty</surname>
              <given-names>TH</given-names>
            </name>
            <name name-style="western">
              <surname>Farrer</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Kraft</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Marazita</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Ordovas</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Pato</surname>
              <given-names>CN</given-names>
            </name>
            <name name-style="western">
              <surname>Spitz</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Wagener</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Junkins</surname>
              <given-names>HA</given-names>
            </name>
            <name name-style="western">
              <surname>Harlan</surname>
              <given-names>WR</given-names>
            </name>
            <name name-style="western">
              <surname>Ramos</surname>
              <given-names>EM</given-names>
            </name>
            <name name-style="western">
              <surname>Haines</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>The PhenX Toolkit: get the most from your measures</article-title>
          <source>Am J Epidemiol</source>
          <year>2011</year>
          <month>08</month>
          <day>01</day>
          <volume>174</volume>
          <issue>3</issue>
          <fpage>253</fpage>
          <lpage>60</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/21749974"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/aje/kwr193</pub-id>
          <pub-id pub-id-type="medline">21749974</pub-id>
          <pub-id pub-id-type="pii">kwr193</pub-id>
          <pub-id pub-id-type="pmcid">PMC3141081</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="web">
          <article-title>Social determinants of health collections</article-title>
          <source>PhenX Toolkit</source>
          <access-date>2024-07-07</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.phenxtoolkit.org/collections/view/6">https://www.phenxtoolkit.org/collections/view/6</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="web">
          <article-title>CMS framework for health equity 2022–2032</article-title>
          <source>Centers for Medicare &amp; Medicaid Services</source>
          <access-date>2024-07-07</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cms.gov/files/document/cms-framework-health-equity.pdf">https://www.cms.gov/files/document/cms-framework-health-equity.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Green</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Zook</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>When talking about social determinants, precision matters</article-title>
          <source>Health Affairs</source>
          <year>2019</year>
          <month>10</month>
          <day>29</day>
          <access-date>2024-07-07</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.healthaffairs.org/content/forefront/talking-social-determinants-precision-matters">https://www.healthaffairs.org/content/forefront/talking-social-determinants-precision-matters</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Craven</surname>
              <given-names>CK</given-names>
            </name>
            <name name-style="western">
              <surname>Highfield</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Basit</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bernstam</surname>
              <given-names>EV</given-names>
            </name>
            <name name-style="western">
              <surname>Choi</surname>
              <given-names>BY</given-names>
            </name>
            <name name-style="western">
              <surname>Ferrer</surname>
              <given-names>RL</given-names>
            </name>
            <name name-style="western">
              <surname>Gelfond</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Pruitt</surname>
              <given-names>SL</given-names>
            </name>
            <name name-style="western">
              <surname>Kannan</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Shireman</surname>
              <given-names>PK</given-names>
            </name>
            <name name-style="western">
              <surname>Spratt</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Morales</surname>
              <given-names>KJ</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>CP</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zozus</surname>
              <given-names>MN</given-names>
            </name>
            <name name-style="western">
              <surname>Sankary</surname>
              <given-names>EC</given-names>
            </name>
            <name name-style="western">
              <surname>Schmidt</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Toward standardization, harmonization, and integration of social determinants of health data: a Texas Clinical and Translational Science Award institutions collaboration</article-title>
          <source>J Clin Transl Sci</source>
          <year>2024</year>
          <volume>8</volume>
          <issue>1</issue>
          <fpage>e17</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38384919"/>
          </comment>
          <pub-id pub-id-type="doi">10.1017/cts.2024.2</pub-id>
          <pub-id pub-id-type="medline">38384919</pub-id>
          <pub-id pub-id-type="pii">S2059866124000025</pub-id>
          <pub-id pub-id-type="pmcid">PMC10880009</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>McClellan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>King</surname>
              <given-names>MC</given-names>
            </name>
          </person-group>
          <article-title>Genetic heterogeneity in human disease</article-title>
          <source>Cell</source>
          <year>2010</year>
          <month>04</month>
          <day>16</day>
          <volume>141</volume>
          <issue>2</issue>
          <fpage>210</fpage>
          <lpage>7</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0092-8674(10)00320-X"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.cell.2010.03.032</pub-id>
          <pub-id pub-id-type="medline">20403315</pub-id>
          <pub-id pub-id-type="pii">S0092-8674(10)00320-X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Waldman</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Terzic</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Therapeutic targeting: a crucible for individualized medicine</article-title>
          <source>Clin Pharmacol Ther</source>
          <year>2008</year>
          <month>05</month>
          <volume>83</volume>
          <issue>5</issue>
          <fpage>651</fpage>
          <lpage>4</lpage>
          <pub-id pub-id-type="doi">10.1038/clpt.2008.65</pub-id>
          <pub-id pub-id-type="medline">18425084</pub-id>
          <pub-id pub-id-type="pii">clpt200865</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rouzier</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Perou</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Symmans</surname>
              <given-names>WF</given-names>
            </name>
            <name name-style="western">
              <surname>Ibrahim</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Cristofanilli</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Anderson</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Hess</surname>
              <given-names>KR</given-names>
            </name>
            <name name-style="western">
              <surname>Stec</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ayers</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wagner</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Morandi</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Fan</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Rabiul</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Ross</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Hortobagyi</surname>
              <given-names>GN</given-names>
            </name>
            <name name-style="western">
              <surname>Pusztai</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Breast cancer molecular subtypes respond differently to preoperative chemotherapy</article-title>
          <source>Clin Cancer Res</source>
          <year>2005</year>
          <month>08</month>
          <day>15</day>
          <volume>11</volume>
          <issue>16</issue>
          <fpage>5678</fpage>
          <lpage>85</lpage>
          <pub-id pub-id-type="doi">10.1158/1078-0432.CCR-04-2421</pub-id>
          <pub-id pub-id-type="medline">16115903</pub-id>
          <pub-id pub-id-type="pii">11/16/5678</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sørlie</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Perou</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Tibshirani</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Aas</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Geisler</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Johnsen</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Hastie</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Eisen</surname>
              <given-names>MB</given-names>
            </name>
            <name name-style="western">
              <surname>van de Rin</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Jeffrey</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Thorsen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Quist</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Matese</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Brown</surname>
              <given-names>PO</given-names>
            </name>
            <name name-style="western">
              <surname>Botstein</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Lønning</surname>
              <given-names>PE</given-names>
            </name>
            <name name-style="western">
              <surname>Børresen-Dale</surname>
              <given-names>AL</given-names>
            </name>
          </person-group>
          <article-title>Gene expression patterns of breast carcinomas distinguish tumor subclasses with clinical implications</article-title>
          <source>Proc Natl Acad Sci U S A</source>
          <year>2001</year>
          <month>09</month>
          <day>11</day>
          <volume>98</volume>
          <issue>19</issue>
          <fpage>10869</fpage>
          <lpage>74</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.pnas.org/cgi/pmidlookup?view=long&amp;pmid=11553815"/>
          </comment>
          <pub-id pub-id-type="doi">10.1073/pnas.191367098</pub-id>
          <pub-id pub-id-type="medline">11553815</pub-id>
          <pub-id pub-id-type="pii">98/19/10869</pub-id>
          <pub-id pub-id-type="pmcid">PMC58566</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fitzpatrick</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Teague</surname>
              <given-names>WG</given-names>
            </name>
            <name name-style="western">
              <surname>Meyers</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Peters</surname>
              <given-names>SP</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wenzel</surname>
              <given-names>SE</given-names>
            </name>
            <name name-style="western">
              <surname>Aujla</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Castro</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bacharier</surname>
              <given-names>LB</given-names>
            </name>
            <name name-style="western">
              <surname>Gaston</surname>
              <given-names>BM</given-names>
            </name>
            <name name-style="western">
              <surname>Bleecker</surname>
              <given-names>ER</given-names>
            </name>
            <name name-style="western">
              <surname>Moore</surname>
              <given-names>WC</given-names>
            </name>
          </person-group>
          <article-title>Heterogeneity of severe asthma in childhood: confirmation by cluster analysis of children in the National Institutes of Health/National Heart, Lung, and Blood Institute Severe Asthma Research Program</article-title>
          <source>J Allergy Clin Immunol</source>
          <year>2011</year>
          <month>02</month>
          <volume>127</volume>
          <issue>2</issue>
          <fpage>382</fpage>
          <lpage>9.e1</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/21195471"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jaci.2010.11.015</pub-id>
          <pub-id pub-id-type="medline">21195471</pub-id>
          <pub-id pub-id-type="pii">S0091-6749(10)01765-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC3060668</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Haldar</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Pavord</surname>
              <given-names>ID</given-names>
            </name>
            <name name-style="western">
              <surname>Shaw</surname>
              <given-names>DE</given-names>
            </name>
            <name name-style="western">
              <surname>Berry</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Thomas</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Brightling</surname>
              <given-names>CE</given-names>
            </name>
            <name name-style="western">
              <surname>Wardlaw</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Green</surname>
              <given-names>RH</given-names>
            </name>
          </person-group>
          <article-title>Cluster analysis and clinical asthma phenotypes</article-title>
          <source>Am J Respir Crit Care Med</source>
          <year>2008</year>
          <month>08</month>
          <day>01</day>
          <volume>178</volume>
          <issue>3</issue>
          <fpage>218</fpage>
          <lpage>24</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/18480428"/>
          </comment>
          <pub-id pub-id-type="doi">10.1164/rccm.200711-1754OC</pub-id>
          <pub-id pub-id-type="medline">18480428</pub-id>
          <pub-id pub-id-type="pmcid">PMC3992366</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lötvall</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Akdis</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Bacharier</surname>
              <given-names>LB</given-names>
            </name>
            <name name-style="western">
              <surname>Bjermer</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Casale</surname>
              <given-names>TB</given-names>
            </name>
            <name name-style="western">
              <surname>Custovic</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lemanske</surname>
              <given-names>RF Jr</given-names>
            </name>
            <name name-style="western">
              <surname>Wardlaw</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Wenzel</surname>
              <given-names>SE</given-names>
            </name>
            <name name-style="western">
              <surname>Greenberger</surname>
              <given-names>PA</given-names>
            </name>
          </person-group>
          <article-title>Asthma endotypes: a new approach to classification of disease entities within the asthma syndrome</article-title>
          <source>J Allergy Clin Immunol</source>
          <year>2011</year>
          <month>02</month>
          <volume>127</volume>
          <issue>2</issue>
          <fpage>355</fpage>
          <lpage>60</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jaci.2010.11.037</pub-id>
          <pub-id pub-id-type="medline">21281866</pub-id>
          <pub-id pub-id-type="pii">S0091-6749(10)01858-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nair</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Pizzichini</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Kjarsgaard</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Inman</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Efthimiadis</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Pizzichini</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Hargreave</surname>
              <given-names>FE</given-names>
            </name>
            <name name-style="western">
              <surname>O'Byrne</surname>
              <given-names>PM</given-names>
            </name>
          </person-group>
          <article-title>Mepolizumab for prednisone-dependent asthma with sputum eosinophilia</article-title>
          <source>N Engl J Med</source>
          <year>2009</year>
          <month>03</month>
          <day>05</day>
          <volume>360</volume>
          <issue>10</issue>
          <fpage>985</fpage>
          <lpage>93</lpage>
          <pub-id pub-id-type="doi">10.1056/NEJMoa0805435</pub-id>
          <pub-id pub-id-type="medline">19264687</pub-id>
          <pub-id pub-id-type="pii">360/10/985</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ortega</surname>
              <given-names>HG</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>Pavord</surname>
              <given-names>ID</given-names>
            </name>
            <name name-style="western">
              <surname>Brusselle</surname>
              <given-names>GG</given-names>
            </name>
            <name name-style="western">
              <surname>FitzGerald</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Chetta</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Humbert</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Katz</surname>
              <given-names>LE</given-names>
            </name>
            <name name-style="western">
              <surname>Keene</surname>
              <given-names>ON</given-names>
            </name>
            <name name-style="western">
              <surname>Yancey</surname>
              <given-names>SW</given-names>
            </name>
            <name name-style="western">
              <surname>Chanez</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Mepolizumab treatment in patients with severe eosinophilic asthma</article-title>
          <source>N Engl J Med</source>
          <year>2014</year>
          <month>09</month>
          <day>25</day>
          <volume>371</volume>
          <issue>13</issue>
          <fpage>1198</fpage>
          <lpage>207</lpage>
          <pub-id pub-id-type="doi">10.1056/nejmoa1403290</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Collins</surname>
              <given-names>FS</given-names>
            </name>
            <name name-style="western">
              <surname>Varmus</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>A new initiative on precision medicine</article-title>
          <source>N Engl J Med</source>
          <year>2015</year>
          <month>02</month>
          <day>26</day>
          <volume>372</volume>
          <issue>9</issue>
          <fpage>793</fpage>
          <lpage>5</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/25635347"/>
          </comment>
          <pub-id pub-id-type="doi">10.1056/NEJMp1500523</pub-id>
          <pub-id pub-id-type="medline">25635347</pub-id>
          <pub-id pub-id-type="pmcid">PMC5101938</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lacy</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Wellenius</surname>
              <given-names>GA</given-names>
            </name>
            <name name-style="western">
              <surname>Carnethon</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Loucks</surname>
              <given-names>EB</given-names>
            </name>
            <name name-style="western">
              <surname>Carson</surname>
              <given-names>AP</given-names>
            </name>
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Kiefe</surname>
              <given-names>CI</given-names>
            </name>
            <name name-style="western">
              <surname>Gjelsvik</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gunderson</surname>
              <given-names>EP</given-names>
            </name>
            <name name-style="western">
              <surname>Eaton</surname>
              <given-names>CB</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>WC</given-names>
            </name>
          </person-group>
          <article-title>Racial differences in the performance of existing risk prediction models for incident type 2 diabetes: the CARDIA study</article-title>
          <source>Diabetes Care</source>
          <year>2016</year>
          <month>02</month>
          <volume>39</volume>
          <issue>2</issue>
          <fpage>285</fpage>
          <lpage>91</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/26628420"/>
          </comment>
          <pub-id pub-id-type="doi">10.2337/dc15-0509</pub-id>
          <pub-id pub-id-type="medline">26628420</pub-id>
          <pub-id pub-id-type="pii">dc15-0509</pub-id>
          <pub-id pub-id-type="pmcid">PMC4722943</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Baker</surname>
              <given-names>JJ</given-names>
            </name>
          </person-group>
          <article-title>Medicare payment system for hospital inpatients: diagnosis-related groups</article-title>
          <source>J Health Care Finance</source>
          <year>2002</year>
          <volume>28</volume>
          <issue>3</issue>
          <fpage>1</fpage>
          <lpage>13</lpage>
          <pub-id pub-id-type="medline">12079147</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lipkovich</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Dmitrienko</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Denne</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Enas</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Subgroup identification based on differential effect search--a recursive partitioning method for establishing response to treatment in patient subpopulations</article-title>
          <source>Stat Med</source>
          <year>2011</year>
          <month>09</month>
          <day>20</day>
          <volume>30</volume>
          <issue>21</issue>
          <fpage>2601</fpage>
          <lpage>21</lpage>
          <pub-id pub-id-type="doi">10.1002/sim.4289</pub-id>
          <pub-id pub-id-type="medline">21786278</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kehl</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Ulm</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Responder identification in clinical trials with censored data</article-title>
          <source>Comput Stat Data Anal</source>
          <year>2006</year>
          <month>03</month>
          <volume>50</volume>
          <issue>5</issue>
          <fpage>1338</fpage>
          <lpage>55</lpage>
          <pub-id pub-id-type="doi">10.1016/j.csda.2004.11.015</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hastie</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Tibshirani</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Friedman</surname>
              <given-names>JH</given-names>
            </name>
          </person-group>
          <source>The Elements of Statistical Learning: Data Mining, Inference, and Prediction</source>
          <year>2001</year>
          <publisher-loc>New York, NY</publisher-loc>
          <publisher-name>Springer</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Abu-Jamous</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Fa</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Nandi</surname>
              <given-names>AK</given-names>
            </name>
          </person-group>
          <source>Integrative Cluster Analysis in Bioinformatics</source>
          <year>2015</year>
          <publisher-loc>Hoboken, NJ</publisher-loc>
          <publisher-name>John Wiley &amp; Sons</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lochner</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Cox</surname>
              <given-names>CS</given-names>
            </name>
          </person-group>
          <article-title>Prevalence of multiple chronic conditions among Medicare beneficiaries, United States, 2010</article-title>
          <source>Prev Chronic Dis</source>
          <year>2013</year>
          <month>04</month>
          <day>25</day>
          <volume>10</volume>
          <fpage>E61</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/23618541"/>
          </comment>
          <pub-id pub-id-type="doi">10.5888/pcd10.120137</pub-id>
          <pub-id pub-id-type="medline">23618541</pub-id>
          <pub-id pub-id-type="pii">E61</pub-id>
          <pub-id pub-id-type="pmcid">PMC3652723</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Aryal</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Diaz-Guzman</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Mannino</surname>
              <given-names>DM</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Rabe</surname>
              <given-names>KF</given-names>
            </name>
            <name name-style="western">
              <surname>Wedzica</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Wouters</surname>
              <given-names>EF</given-names>
            </name>
          </person-group>
          <article-title>Prevalence of COPD and comorbidity</article-title>
          <source>COPD and Comorbidity</source>
          <year>2013</year>
          <publisher-loc>Sheffield, UK</publisher-loc>
          <publisher-name>European Respiratory Society</publisher-name>
          <fpage>1</fpage>
          <lpage>12</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Baty</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Putora</surname>
              <given-names>PM</given-names>
            </name>
            <name name-style="western">
              <surname>Isenring</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Blum</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Brutsche</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Comorbidities and burden of COPD: a population based case-control study</article-title>
          <source>PLoS One</source>
          <year>2013</year>
          <volume>8</volume>
          <issue>5</issue>
          <fpage>e63285</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0063285"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0063285</pub-id>
          <pub-id pub-id-type="medline">23691009</pub-id>
          <pub-id pub-id-type="pii">PONE-D-12-37141</pub-id>
          <pub-id pub-id-type="pmcid">PMC3656944</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Moni</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Liò</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Network-based analysis of comorbidities risk during an infection: SARS and HIV case studies</article-title>
          <source>BMC Bioinformatics</source>
          <year>2014</year>
          <month>10</month>
          <day>24</day>
          <volume>15</volume>
          <issue>1</issue>
          <fpage>333</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcbioinformatics.biomedcentral.com/articles/10.1186/1471-2105-15-333"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1471-2105-15-333</pub-id>
          <pub-id pub-id-type="medline">25344230</pub-id>
          <pub-id pub-id-type="pii">1471-2105-15-333</pub-id>
          <pub-id pub-id-type="pmcid">PMC4363349</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cramer</surname>
              <given-names>AO</given-names>
            </name>
            <name name-style="western">
              <surname>Waldorp</surname>
              <given-names>LJ</given-names>
            </name>
            <name name-style="western">
              <surname>van der Maas</surname>
              <given-names>HL</given-names>
            </name>
            <name name-style="western">
              <surname>Borsboom</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Comorbidity: a network perspective</article-title>
          <source>Behav Brain Sci</source>
          <year>2010</year>
          <month>06</month>
          <volume>33</volume>
          <issue>2-3</issue>
          <fpage>137</fpage>
          <lpage>50; discussion 150</lpage>
          <pub-id pub-id-type="doi">10.1017/S0140525X09991567</pub-id>
          <pub-id pub-id-type="medline">20584369</pub-id>
          <pub-id pub-id-type="pii">S0140525X09991567</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Islam</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Valderas</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Yen</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Dawda</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Jowsey</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>McRae</surname>
              <given-names>IS</given-names>
            </name>
          </person-group>
          <article-title>Multimorbidity and comorbidity of chronic diseases among the senior Australians: prevalence and patterns</article-title>
          <source>PLoS One</source>
          <year>2014</year>
          <volume>9</volume>
          <issue>1</issue>
          <fpage>e83783</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0083783"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0083783</pub-id>
          <pub-id pub-id-type="medline">24421905</pub-id>
          <pub-id pub-id-type="pii">PONE-D-13-31674</pub-id>
          <pub-id pub-id-type="pmcid">PMC3885451</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Folino</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Pizzuti</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Ventura</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>A comorbidity network approach to predict disease risk</article-title>
          <source>Proceedings of the Information, Technology in Bio- and Medical Informatics</source>
          <year>2010</year>
          <conf-name>ITBAM 2010</conf-name>
          <conf-date>September 1-2, 2010</conf-date>
          <conf-loc>Bilbao, Spain</conf-loc>
          <pub-id pub-id-type="doi">10.1007/978-3-642-15020-3_10</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Newman</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <source>Networks: An Introduction</source>
          <year>2010</year>
          <publisher-loc>Oxford, UK</publisher-loc>
          <publisher-name>Oxford University Press</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Treviño</surname>
              <given-names>S III</given-names>
            </name>
            <name name-style="western">
              <surname>Nyberg</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Del Genio</surname>
              <given-names>CI</given-names>
            </name>
            <name name-style="western">
              <surname>Bassler</surname>
              <given-names>KE</given-names>
            </name>
          </person-group>
          <article-title>Fast and accurate determination of modularity and its effect size</article-title>
          <source>J Stat Mech Theor Exp</source>
          <year>2015</year>
          <month>02</month>
          <day>03</day>
          <issue>2015</issue>
          <fpage>P02003</fpage>
          <pub-id pub-id-type="doi">10.1088/1742-5468/2015/02/P02003</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chauhan</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Ravi</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Datta</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Schnappinger</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Bassler</surname>
              <given-names>KE</given-names>
            </name>
            <name name-style="western">
              <surname>Balázsi</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Gennaro</surname>
              <given-names>ML</given-names>
            </name>
          </person-group>
          <article-title>Reconstruction and topological characterization of the sigma factor regulatory network of Mycobacterium tuberculosis</article-title>
          <source>Nat Commun</source>
          <year>2016</year>
          <month>03</month>
          <day>31</day>
          <volume>7</volume>
          <fpage>11062</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/ncomms11062"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/ncomms11062</pub-id>
          <pub-id pub-id-type="medline">27029515</pub-id>
          <pub-id pub-id-type="pii">ncomms11062</pub-id>
          <pub-id pub-id-type="pmcid">PMC4821874</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bhavnani</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Dang</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Penton</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Visweswaran</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bassler</surname>
              <given-names>KE</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Raji</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Divekar</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Zuhour</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Karmarkar</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kuo</surname>
              <given-names>YF</given-names>
            </name>
            <name name-style="western">
              <surname>Ottenbacher</surname>
              <given-names>KJ</given-names>
            </name>
          </person-group>
          <article-title>How high-risk comorbidities co-occur in readmitted patients with hip fracture: big data visual analytical approach</article-title>
          <source>JMIR Med Inform</source>
          <year>2020</year>
          <month>10</month>
          <day>26</day>
          <volume>8</volume>
          <issue>10</issue>
          <fpage>e13567</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2020/10/e13567/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/13567</pub-id>
          <pub-id pub-id-type="medline">33103657</pub-id>
          <pub-id pub-id-type="pii">v8i10e13567</pub-id>
          <pub-id pub-id-type="pmcid">PMC7652691</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fruchterman</surname>
              <given-names>TM</given-names>
            </name>
            <name name-style="western">
              <surname>Reingold</surname>
              <given-names>EM</given-names>
            </name>
          </person-group>
          <article-title>Graph drawing by force‐directed placement</article-title>
          <source>Softw Pract Exp</source>
          <year>2006</year>
          <month>10</month>
          <day>30</day>
          <volume>21</volume>
          <issue>11</issue>
          <fpage>1129</fpage>
          <lpage>64</lpage>
          <pub-id pub-id-type="doi">10.1002/spe.4380211102</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dang</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Bassler</surname>
              <given-names>KE</given-names>
            </name>
            <name name-style="western">
              <surname>Bhavnani</surname>
              <given-names>SK</given-names>
            </name>
          </person-group>
          <article-title>ExplodeLayout: enhancing the comprehension of large and dense networks</article-title>
          <source>Proceedings of AMIA Summit on Translational Bioinformatics</source>
          <year>2016</year>
          <conf-name>AMIA 2016</conf-name>
          <conf-date>March 21-22, 2016</conf-date>
          <conf-loc>San Francisco, CA</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bhavnani</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ayyaswamy</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Visweswaran</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bellala</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Divekar</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Bassler</surname>
              <given-names>KE</given-names>
            </name>
          </person-group>
          <article-title>Enabling comprehension of patient subgroups and characteristics in large bipartite networks: implications for precision medicine</article-title>
          <source>AMIA Jt Summits Transl Sci Proc</source>
          <year>2017</year>
          <volume>2017</volume>
          <fpage>21</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/28815099"/>
          </comment>
          <pub-id pub-id-type="medline">28815099</pub-id>
          <pub-id pub-id-type="pmcid">PMC5543384</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bhavnani</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Eichinger</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Martini</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Saxman</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Jagadish</surname>
              <given-names>HV</given-names>
            </name>
            <name name-style="western">
              <surname>Kretzler</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Network analysis of genes regulated in renal diseases: implications for a molecular-based classification</article-title>
          <source>BMC Bioinformatics</source>
          <year>2009</year>
          <month>09</month>
          <day>17</day>
          <volume>10 Suppl 9</volume>
          <issue>Suppl 9</issue>
          <fpage>S3</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcbioinformatics.biomedcentral.com/articles/10.1186/1471-2105-10-S9-S3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1471-2105-10-S9-S3</pub-id>
          <pub-id pub-id-type="medline">19761573</pub-id>
          <pub-id pub-id-type="pii">1471-2105-10-S9-S3</pub-id>
          <pub-id pub-id-type="pmcid">PMC2745690</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bhavnani</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Bellala</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Ganesan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Krishna</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Saxman</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Scott</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Silveira</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Given</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>The nested structure of cancer symptoms. Implications for analyzing co-occurrence and managing symptoms</article-title>
          <source>Methods Inf Med</source>
          <year>2010</year>
          <volume>49</volume>
          <issue>6</issue>
          <fpage>581</fpage>
          <lpage>91</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/21085743"/>
          </comment>
          <pub-id pub-id-type="doi">10.3414/ME09-01-0083</pub-id>
          <pub-id pub-id-type="medline">21085743</pub-id>
          <pub-id pub-id-type="pii">09-01-0083</pub-id>
          <pub-id pub-id-type="pmcid">PMC3647463</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bhavnani</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Ganesan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hall</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Maslowski</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Eichinger</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Martini</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Saxman</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Bellala</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Kretzler</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Discovering hidden relationships between renal diseases and regulated genes through 3D network visualizations</article-title>
          <source>BMC Res Notes</source>
          <year>2010</year>
          <month>11</month>
          <day>11</day>
          <volume>3</volume>
          <fpage>296</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcresnotes.biomedcentral.com/articles/10.1186/1756-0500-3-296"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1756-0500-3-296</pub-id>
          <pub-id pub-id-type="medline">21070623</pub-id>
          <pub-id pub-id-type="pii">1756-0500-3-296</pub-id>
          <pub-id pub-id-type="pmcid">PMC3001742</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bhavnani</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Victor</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Calhoun</surname>
              <given-names>WJ</given-names>
            </name>
            <name name-style="western">
              <surname>Busse</surname>
              <given-names>WW</given-names>
            </name>
            <name name-style="western">
              <surname>Bleecker</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Castro</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ju</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Pillai</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Oezguen</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Bellala</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Brasier</surname>
              <given-names>AR</given-names>
            </name>
          </person-group>
          <article-title>How cytokines co-occur across asthma patients: from bipartite network analysis to a molecular-based classification</article-title>
          <source>J Biomed Inform</source>
          <year>2011</year>
          <month>12</month>
          <volume>44 Suppl 1</volume>
          <issue>Suppl 1</issue>
          <fpage>S24</fpage>
          <lpage>30</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(11)00166-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2011.09.006</pub-id>
          <pub-id pub-id-type="medline">21986291</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(11)00166-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC3277832</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bhavnani</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Bellala</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Victor</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bassler</surname>
              <given-names>KE</given-names>
            </name>
            <name name-style="western">
              <surname>Visweswaran</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>The role of complementary bipartite visual analytical representations in the analysis of SNPs: a case study in ancestral informative markers</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2012</year>
          <month>06</month>
          <volume>19</volume>
          <issue>e1</issue>
          <fpage>e5</fpage>
          <lpage>12</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/22718038"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/amiajnl-2011-000745</pub-id>
          <pub-id pub-id-type="medline">22718038</pub-id>
          <pub-id pub-id-type="pii">amiajnl-2011-000745</pub-id>
          <pub-id pub-id-type="pmcid">PMC3392853</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref61">
        <label>61</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bhavnani</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Dang</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Bellala</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Divekar</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Visweswaran</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Brasier</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>Kurosky</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Unlocking proteomic heterogeneity in complex diseases through visual analytics</article-title>
          <source>Proteomics</source>
          <year>2015</year>
          <month>04</month>
          <volume>15</volume>
          <issue>8</issue>
          <fpage>1405</fpage>
          <lpage>18</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/25684269"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/pmic.201400451</pub-id>
          <pub-id pub-id-type="medline">25684269</pub-id>
          <pub-id pub-id-type="pmcid">PMC4471338</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref62">
        <label>62</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bhavnani</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Dang</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Kilaru</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Caro</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Visweswaran</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Saade</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>AK</given-names>
            </name>
            <name name-style="western">
              <surname>Menon</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Methylation differences reveal heterogeneity in preterm pathophysiology: results from bipartite network analyses</article-title>
          <source>J Perinat Med</source>
          <year>2018</year>
          <month>07</month>
          <day>26</day>
          <volume>46</volume>
          <issue>5</issue>
          <fpage>509</fpage>
          <lpage>21</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/28665803"/>
          </comment>
          <pub-id pub-id-type="doi">10.1515/jpm-2017-0126</pub-id>
          <pub-id pub-id-type="medline">28665803</pub-id>
          <pub-id pub-id-type="pii">jpm-2017-0126</pub-id>
          <pub-id pub-id-type="pmcid">PMC5971156</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref63">
        <label>63</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bhavnani</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Kummerfeld</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Kuo</surname>
              <given-names>YF</given-names>
            </name>
            <name name-style="western">
              <surname>Garg</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Visweswaran</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Raji</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Radhakrishnan</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Golvoko</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Hatch</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Usher</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Melton-Meaux</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Tignanelli</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Heterogeneity in COVID-19 patients at multiple levels of granularity: from biclusters to clinical interventions</article-title>
          <source>AMIA Jt Summits Transl Sci Proc</source>
          <year>2021</year>
          <volume>2021</volume>
          <fpage>112</fpage>
          <lpage>21</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34457125"/>
          </comment>
          <pub-id pub-id-type="medline">34457125</pub-id>
          <pub-id pub-id-type="pii">3479237</pub-id>
          <pub-id pub-id-type="pmcid">PMC8378636</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref64">
        <label>64</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shneiderman</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Human-centered AI: ensuring human control while increasing automation</article-title>
          <source>Proceedings of the 5th Workshop on Human Factors in Hypertext</source>
          <year>2022</year>
          <conf-name>HT '22</conf-name>
          <conf-date>June 28, 2022</conf-date>
          <conf-loc>Barcelona, Spain</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3538882.3542790</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref65">
        <label>65</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Clayton</surname>
              <given-names>EW</given-names>
            </name>
            <name name-style="western">
              <surname>Novak</surname>
              <given-names>LL</given-names>
            </name>
            <name name-style="western">
              <surname>Anders</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Malin</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Human-centered design to address biases in artificial intelligence</article-title>
          <source>J Med Internet Res</source>
          <year>2023</year>
          <month>03</month>
          <day>24</day>
          <volume>25</volume>
          <fpage>e43251</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2023//e43251/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/43251</pub-id>
          <pub-id pub-id-type="medline">36961506</pub-id>
          <pub-id pub-id-type="pii">v25i1e43251</pub-id>
          <pub-id pub-id-type="pmcid">PMC10132017</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref66">
        <label>66</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shneiderman</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Human-centered artificial intelligence: reliable, safe and trustworthy</article-title>
          <source>Int J Hum Comput Interact</source>
          <year>2020</year>
          <month>03</month>
          <day>23</day>
          <volume>36</volume>
          <issue>6</issue>
          <fpage>495</fpage>
          <lpage>504</lpage>
          <pub-id pub-id-type="doi">10.1080/10447318.2020.1741118</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref67">
        <label>67</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>SB</given-names>
            </name>
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>NT</given-names>
            </name>
          </person-group>
          <article-title>Creation of a mapped, machine-readable taxonomy to facilitate extraction of social determinants of health data from electronic health records</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2021</year>
          <volume>2021</volume>
          <fpage>959</fpage>
          <lpage>68</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35308929"/>
          </comment>
          <pub-id pub-id-type="medline">35308929</pub-id>
          <pub-id pub-id-type="pii">3577288</pub-id>
          <pub-id pub-id-type="pmcid">PMC8861691</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref68">
        <label>68</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Allen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Balfour</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Bell</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Marmot</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Social determinants of mental health</article-title>
          <source>Int Rev Psychiatry</source>
          <year>2014</year>
          <month>08</month>
          <volume>26</volume>
          <issue>4</issue>
          <fpage>392</fpage>
          <lpage>407</lpage>
          <pub-id pub-id-type="doi">10.3109/09540261.2014.928270</pub-id>
          <pub-id pub-id-type="medline">25137105</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref69">
        <label>69</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Busse</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Yim</surname>
              <given-names>IS</given-names>
            </name>
            <name name-style="western">
              <surname>Campos</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Marshburn</surname>
              <given-names>CK</given-names>
            </name>
          </person-group>
          <article-title>Discrimination and the HPA axis: current evidence and future directions</article-title>
          <source>J Behav Med</source>
          <year>2017</year>
          <month>08</month>
          <volume>40</volume>
          <issue>4</issue>
          <fpage>539</fpage>
          <lpage>52</lpage>
          <pub-id pub-id-type="doi">10.1007/s10865-017-9830-6</pub-id>
          <pub-id pub-id-type="medline">28155003</pub-id>
          <pub-id pub-id-type="pii">10.1007/s10865-017-9830-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref70">
        <label>70</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Decker</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Weaver</surname>
              <given-names>RH</given-names>
            </name>
          </person-group>
          <article-title>Health and social determinants associated with delay of care among community-dwelling rural older adults</article-title>
          <source>Fam Community Health</source>
          <year>2024</year>
          <volume>47</volume>
          <issue>1</issue>
          <fpage>41</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1097/FCH.0000000000000386</pub-id>
          <pub-id pub-id-type="medline">37753957</pub-id>
          <pub-id pub-id-type="pii">00003727-990000000-00029</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref71">
        <label>71</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Newton</surname>
              <given-names>MF</given-names>
            </name>
            <name name-style="western">
              <surname>Keirns</surname>
              <given-names>CC</given-names>
            </name>
            <name name-style="western">
              <surname>Cunningham</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Hayward</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Stanley</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Uninsured adults presenting to US emergency departments: assumptions vs data</article-title>
          <source>JAMA</source>
          <year>2008</year>
          <month>10</month>
          <day>22</day>
          <volume>300</volume>
          <issue>16</issue>
          <fpage>1914</fpage>
          <lpage>24</lpage>
          <pub-id pub-id-type="doi">10.1001/jama.300.16.1914</pub-id>
          <pub-id pub-id-type="medline">18940978</pub-id>
          <pub-id pub-id-type="pii">300/16/1914</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref72">
        <label>72</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bhavnani</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Visweswaran</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Raji</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kuo</surname>
              <given-names>YF</given-names>
            </name>
          </person-group>
          <article-title>A framework for modeling and interpreting patient subgroups applied to hospital readmission: visual analytical approach</article-title>
          <source>JMIR Med Inform</source>
          <year>2022</year>
          <month>12</month>
          <day>07</day>
          <volume>10</volume>
          <issue>12</issue>
          <fpage>e37239</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2022/12/e37239/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/37239</pub-id>
          <pub-id pub-id-type="medline">35537203</pub-id>
          <pub-id pub-id-type="pii">v10i12e37239</pub-id>
          <pub-id pub-id-type="pmcid">PMC9773032</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref73">
        <label>73</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>van der Wal</surname>
              <given-names>WM</given-names>
            </name>
            <name name-style="western">
              <surname>Geskus</surname>
              <given-names>RB</given-names>
            </name>
          </person-group>
          <article-title>ipw: an R package for inverse probability weighting</article-title>
          <source>J Stat Softw</source>
          <year>2011</year>
          <volume>43</volume>
          <issue>13</issue>
          <fpage>1</fpage>
          <lpage>23</lpage>
          <pub-id pub-id-type="doi">10.18637/jss.v043.i13</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref74">
        <label>74</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Thoemmes</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Ong</surname>
              <given-names>AD</given-names>
            </name>
          </person-group>
          <article-title>A primer on inverse probability of treatment weighting and marginal structural models</article-title>
          <source>Emerg Adulthood</source>
          <year>2015</year>
          <month>12</month>
          <day>16</day>
          <volume>4</volume>
          <issue>1</issue>
          <fpage>40</fpage>
          <lpage>59</lpage>
          <pub-id pub-id-type="doi">10.1177/2167696815621645</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref75">
        <label>75</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>YH</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Fatori</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Bauermeister</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Luh</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Clark</surname>
              <given-names>CR</given-names>
            </name>
            <name name-style="western">
              <surname>Bauermeister</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Brunoni</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>Smoller</surname>
              <given-names>JW</given-names>
            </name>
          </person-group>
          <article-title>Association of everyday discrimination with depressive symptoms and suicidal ideation during the COVID-19 pandemic in the All of Us research program</article-title>
          <source>JAMA Psychiatry</source>
          <year>2022</year>
          <month>09</month>
          <day>01</day>
          <volume>79</volume>
          <issue>9</issue>
          <fpage>898</fpage>
          <lpage>906</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35895053"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jamapsychiatry.2022.1973</pub-id>
          <pub-id pub-id-type="medline">35895053</pub-id>
          <pub-id pub-id-type="pii">2794428</pub-id>
          <pub-id pub-id-type="pmcid">PMC9330278</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref76">
        <label>76</label>
        <nlm-citation citation-type="web">
          <article-title>All of Us IRB ControlledTier revised letter 08312021</article-title>
          <source>National Institutes of Health</source>
          <year>2021</year>
          <access-date>2024-07-07</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.researchallofus.org/wp-content/themes/research-hub-wordpress-theme/media/2023/All_of_Us_IRB_ControlledTier_Revised_Letter_08312021%20-%20signed.pdf">https://www.researchallofus.org/wp-content/themes/research-hub-wordpress-theme/media/2023/All_of_Us_IRB_ControlledTier_Revised_Letter_08312021%20-%20signed.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref77">
        <label>77</label>
        <nlm-citation citation-type="web">
          <article-title>Do I need my project reviewed by the All of Us Institutional Review Board (IRB) in order to access this data using the Researcher Workbench?</article-title>
          <source>All of Us Research Hub</source>
          <access-date>2024-07-07</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.researchallofus.org/faq/do-i-need-my-project-reviewed-by-the-all-of-us-institutional-review-board-irb-in-order-to-access-this-data-using-the-researcher-workbench/">https://www.researchallofus.org/faq/do-i-need-my-project-reviewed-by-the-all-of-us-institutional-review-board-irb-in-order-to-access-this-data-using-the-researcher-workbench/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref78">
        <label>78</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Bhavnani</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>BipartiteModularityMaximization: partition bipartite network into non-overlapping biclusters by optimizing bipartite modularity</article-title>
          <source>The Comprehensive R Archive Network</source>
          <year>2023</year>
          <month>1</month>
          <day>21</day>
          <access-date>2024-07-07</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cran.r-project.org/web/packages/BipartiteModularityMaximization/index.html">https://cran.r-project.org/web/packages/BipartiteModularityMaximization/index.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref79">
        <label>79</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bhavnani</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>ExplodeLayout: calculate exploded coordinates based on original node coordinates and node clustering membership</article-title>
          <source>The Comprehensive R Archive Network</source>
          <year>2022</year>
          <month>7</month>
          <day>1</day>
          <access-date>2024-07-07</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cran.r-project.org/web/packages/ExplodeLayout/index.html">https://cran.r-project.org/web/packages/ExplodeLayout/index.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref80">
        <label>80</label>
        <nlm-citation citation-type="web">
          <article-title>CRAN R packages by number of downloads</article-title>
          <source>DataScienceMeta</source>
          <access-date>2024-07-07</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.datasciencemeta.com/rpackages">http://www.datasciencemeta.com/rpackages</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref81">
        <label>81</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bhavnani</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Bao</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kuo</surname>
              <given-names>YF</given-names>
            </name>
            <name name-style="western">
              <surname>Reistetter</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Hatch</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Urban</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Raji</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Downer</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>341 The impact of critical social determinants of health on personal medical decisions: analysis of older Americans in All of Us</article-title>
          <source>J Clin Transl Sci</source>
          <year>2023</year>
          <month>04</month>
          <day>24</day>
          <volume>7</volume>
          <issue>s1</issue>
          <fpage>101</fpage>
          <pub-id pub-id-type="doi">10.1017/cts.2023.385</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref82">
        <label>82</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bhavnani</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Bao</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Hatch</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Reistetter</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Downer</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>284 Generalizable machine learning methods for subtyping individuals on national health databases: case studies using data from HRS, N3C, and All of Us</article-title>
          <source>J Clin Transl Sci</source>
          <year>2023</year>
          <month>04</month>
          <day>24</day>
          <volume>7</volume>
          <issue>s1</issue>
          <fpage>85</fpage>
          <pub-id pub-id-type="doi">10.1017/cts.2023.340</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref83">
        <label>83</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dhillon</surname>
              <given-names>IS</given-names>
            </name>
            <name name-style="western">
              <surname>Sra</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Generalized nonnegative matrix approximations with Bregman divergences</article-title>
          <source>Proceedings of the 18th International Conference on Neural Information Processing Systems</source>
          <year>2005</year>
          <conf-name>NIPS'05</conf-name>
          <conf-date>December 5-8, 2005</conf-date>
          <conf-loc>Vancouver, BC</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref84">
        <label>84</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dilsizian</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Siegel</surname>
              <given-names>EL</given-names>
            </name>
          </person-group>
          <article-title>Machine meets biology: a primer on artificial intelligence in cardiology and cardiac imaging</article-title>
          <source>Curr Cardiol Rep</source>
          <year>2018</year>
          <month>10</month>
          <day>18</day>
          <volume>20</volume>
          <issue>12</issue>
          <fpage>139</fpage>
          <pub-id pub-id-type="doi">10.1007/s11886-018-1074-8</pub-id>
          <pub-id pub-id-type="medline">30334108</pub-id>
          <pub-id pub-id-type="pii">10.1007/s11886-018-1074-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref85">
        <label>85</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bhavnani</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Visweswaran</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Divekar</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Brasier</surname>
              <given-names>AR</given-names>
            </name>
          </person-group>
          <article-title>Towards team-centered informatics: accelerating innovation in multidisciplinary scientific teams through visual analytics</article-title>
          <source>J Appl Behav Sci</source>
          <year>2018</year>
          <month>11</month>
          <day>05</day>
          <volume>55</volume>
          <issue>1</issue>
          <fpage>50</fpage>
          <lpage>72</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1177/0021886318794606"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/0021886318794606</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref86">
        <label>86</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wooten</surname>
              <given-names>KC</given-names>
            </name>
            <name name-style="western">
              <surname>Calhoun</surname>
              <given-names>WJ</given-names>
            </name>
            <name name-style="western">
              <surname>Bhavnani</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Rose</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Ameredes</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Brasier</surname>
              <given-names>AR</given-names>
            </name>
          </person-group>
          <article-title>Evolution of multidisciplinary translational teams (MTTs): insights for accelerating translational innovations</article-title>
          <source>Clin Transl Sci</source>
          <year>2015</year>
          <month>10</month>
          <volume>8</volume>
          <issue>5</issue>
          <fpage>542</fpage>
          <lpage>52</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/25801998"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/cts.12266</pub-id>
          <pub-id pub-id-type="medline">25801998</pub-id>
          <pub-id pub-id-type="pmcid">PMC4575623</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref87">
        <label>87</label>
        <nlm-citation citation-type="web">
          <article-title>Hope</article-title>
          <source>St. Vincent's House</source>
          <access-date>2024-10-15</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.stvhope.org/">https://www.stvhope.org/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref88">
        <label>88</label>
        <nlm-citation citation-type="web">
          <article-title>Register - All of Us Research Hub</article-title>
          <source>All of Us Research Hub</source>
          <access-date>2024-07-07</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.researchallofus.org/register/">https://www.researchallofus.org/register/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
