<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v26i1e50890</article-id>
      <article-id pub-id-type="pmid">38289657</article-id>
      <article-id pub-id-type="doi">10.2196/50890</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Tutorial</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Tutorial</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Machine Learning and Health Science Research: Tutorial</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Mavragani</surname>
            <given-names>Amaryllis</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Sáez</surname>
            <given-names>Carlos</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Ren</surname>
            <given-names>Ziyou</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Aczon</surname>
            <given-names>Melissa</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Cho</surname>
            <given-names>Hunyong</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0087-0079</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" corresp="yes" equal-contrib="yes">
          <name name-style="western">
            <surname>She</surname>
            <given-names>Jane</given-names>
          </name>
          <degrees>BA</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Department of Biostatistics</institution>
            <institution>University of North Carolina at Chapel Hill</institution>
            <addr-line>3101 McGavran-Greenberg Hall</addr-line>
            <addr-line>CB #7420</addr-line>
            <addr-line>Chapel Hill, NC, 27599-7420</addr-line>
            <country>United States</country>
            <phone>1 (919) 966 7250</phone>
            <email>jane.she@unc.edu</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8488-4357</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>De Marchi</surname>
            <given-names>Daniel</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9222-8840</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>El-Zaatari</surname>
            <given-names>Helal</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0617-1559</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Barnes</surname>
            <given-names>Edward L</given-names>
          </name>
          <degrees>MPH, MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9894-8796</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Kahkoska</surname>
            <given-names>Anna R</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <xref rid="aff5" ref-type="aff">5</xref>
          <xref rid="aff6" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2701-101X</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Kosorok</surname>
            <given-names>Michael R</given-names>
          </name>
          <degrees>MM, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6070-9738</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Virkud</surname>
            <given-names>Arti V</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff7" ref-type="aff">7</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0673-5780</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Department of Biostatistics</institution>
        <institution>University of North Carolina at Chapel Hill</institution>
        <addr-line>Chapel Hill, NC</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Division of Gastroenterology and Hepatology</institution>
        <institution>University of North Carolina at Chapel Hill</institution>
        <addr-line>Chapel Hill, NC</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Center for Gastrointestinal Biology and Diseases</institution>
        <institution>University of North Carolina at Chapel Hill</institution>
        <addr-line>Chapel Hill, NC</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Department of Nutrition</institution>
        <institution>University of North Carolina at Chapel Hill</institution>
        <addr-line>Chapel Hill, NC</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Division of Endocrinology and Metabolism</institution>
        <institution>University of North Carolina at Chapel Hill</institution>
        <addr-line>Chapel Hill, NC</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff6">
        <label>6</label>
        <institution>Center for Aging and Health</institution>
        <institution>University of North Carolina at Chapel Hill</institution>
        <addr-line>Chapel Hill, NC</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff7">
        <label>7</label>
        <institution>Kidney Center</institution>
        <institution>University of North Carolina at Chapel Hill</institution>
        <addr-line>Chapel Hill, NC</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Jane She <email>jane.she@unc.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2024</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>30</day>
        <month>1</month>
        <year>2024</year>
      </pub-date>
      <volume>26</volume>
      <elocation-id>e50890</elocation-id>
      <history>
        <date date-type="received">
          <day>15</day>
          <month>7</month>
          <year>2023</year>
        </date>
        <date date-type="rev-request">
          <day>11</day>
          <month>10</month>
          <year>2023</year>
        </date>
        <date date-type="rev-recd">
          <day>30</day>
          <month>11</month>
          <year>2023</year>
        </date>
        <date date-type="accepted">
          <day>21</day>
          <month>12</month>
          <year>2023</year>
        </date>
      </history>
      <copyright-statement>©Hunyong Cho, Jane She, Daniel De Marchi, Helal El-Zaatari, Edward L Barnes, Anna R Kahkoska, Michael R Kosorok, Arti V Virkud. Originally published in the Journal of Medical Internet Research (https://www.jmir.org), 30.01.2024.</copyright-statement>
      <copyright-year>2024</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on https://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2024/1/e50890" xlink:type="simple"/>
      <abstract>
        <p>Machine learning (ML) has seen impressive growth in health science research due to its capacity for handling complex data to perform a range of tasks, including unsupervised learning, supervised learning, and reinforcement learning. To aid health science researchers in understanding the strengths and limitations of ML and to facilitate its integration into their studies, we present here a guideline for integrating ML into an analysis through a structured framework, covering steps from framing a research question to study design and analysis techniques for specialized data types.</p>
      </abstract>
      <kwd-group>
        <kwd>health science researcher</kwd>
        <kwd>machine learning pipeline</kwd>
        <kwd>machine learning</kwd>
        <kwd>medical machine learning</kwd>
        <kwd>precision medicine</kwd>
        <kwd>reproducibility</kwd>
        <kwd>unsupervised learning</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>As a brief overview, machine learning (ML) is generally characterized by model complexity and capacity for processing high-dimensional or complicated data forms and is often mentioned as an antonym to traditional statistical learning algorithms. However, this division is not clear, and ML algorithms range from traditional statistical analysis tools such as simple linear regression to cutting-edge deep neural network algorithms. While often used interchangeably with artificial intelligence (AI), ML is a subset of AI and seeks to use data-driven methods to identify patterns and make decisions. This can then be used in the field of AI to allow problem-solving and decision-making.</p>
      <p>ML is becoming increasingly popular in the research community due to the proliferation of complex or unstructured data sets and the increased capacity and access to computing power needed to run these models. ML models can often discover sophisticated and surprising patterns in these data sets that would be difficult to discover using classical methods [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. The health science research domain has been no exception to this paradigm, as the health science fields have an abundance of data well suited for these models, such as genomics sequencing data and electronic health records (EHR) data [<xref ref-type="bibr" rid="ref3">3</xref>-<xref ref-type="bibr" rid="ref6">6</xref>]. Applications of ML to the health field can lead to targeted interventions to provide support for health care professionals [<xref ref-type="bibr" rid="ref7">7</xref>]. ML has also become almost indispensable to the fast-growing field of PM, which uses rich patient information to precisely target interventions [<xref ref-type="bibr" rid="ref8">8</xref>].</p>
      <p>This paper provides a sequential framework for health scientists intending to use ML in a research proposal and discusses types of analyses that can be done and factors to consider. It will also include a special introduction to the field of PM, which has become a popular research area with the development of new ML methodologies. Finally, we discuss some unique data types and analysis techniques specific to those application areas. In general, throughout the study design process, documentation and preplanning are highly recommended for the sake of reproducibility of the work carried out. For a visual illustration of the research pipeline flowchart, see <xref rid="figure1" ref-type="fig">Figure 1</xref>. There are also existing pipelines such as MLOps and CRISP used in business and industry settings that may be adapted to health science research fields; however, this paper will follow a framework more commonly seen in health science research. We relegate some technical topics, such as general sample size calculations, model training, and model tuning and validation to <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> [<xref ref-type="bibr" rid="ref9">9</xref>-<xref ref-type="bibr" rid="ref21">21</xref>]. Readers are also encouraged to reference other ML primers, such as one for epidemiologists [<xref ref-type="bibr" rid="ref22">22</xref>] and 1 for biologists [<xref ref-type="bibr" rid="ref23">23</xref>].</p>
      <fig id="figure1" position="float">
        <label>Figure 1</label>
        <caption>
          <p>Machine learning workflow for a health science research question, from research question refinement to results reporting, with additional considerations. The cyclic nature of the process is reflected in the arrows, as several different iterations may be considered before narrowing down to a decisive pipeline, leading to result reporting.</p>
        </caption>
        <graphic xlink:href="jmir_v26i1e50890_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
    </sec>
    <sec>
      <title>Experimentation</title>
      <p>This section introduces step-by-step core considerations for designing an ML-involved research project.</p>
      <sec>
        <title>Refining Research Questions: What Can Machine Learning Do?</title>
        <p>ML methods can be used to answer questions for studies that may fall within the following categories: prediction, estimation, understanding causal associations, and decision support. ML can also help support main analyses as an auxiliary tool through missing data imputation, inverse propensity score weighting, dimensionality reduction, and variable selection. This last point will be covered further in the Data Collection and Preprocessing section.</p>
        <p>Inquiries in traditional studies are often limited to the discovery and measurement of the size of certain effects or to establishing the causal relationship between variables. These are called estimation and causal inference, respectively. The recent realm of research has also expanded to prediction [<xref ref-type="bibr" rid="ref24">24</xref>], where algorithms can predict an outcome for a patient when given a set of input variables. Functionalities such as estimation, establishing causal relationships, and prediction are meant to, in an indirect manner, support clinical decision-making. However, there are decision-support frameworks that explicitly provide recommendations through reinforcement learning (RL; defined in the section Advanced Concepts). One of the most important applications in the medical domain is PM, where the goal is to provide an optimal treatment for individual patients each with unique characteristics [<xref ref-type="bibr" rid="ref8">8</xref>].</p>
      </sec>
      <sec>
        <title>Prediction</title>
        <p>As a concrete example, suppose a researcher is interested in investigating the health effects of electronic screen time use over several months [<xref ref-type="bibr" rid="ref25">25</xref>]. This is an example of a study where the research question hinges on accurate prediction of the use of a screen. Since it is impractical and unethical to monitor an individual for several months and self-reported measures can be unreliable, the use of ML algorithms for predicting screen time is useful [<xref ref-type="bibr" rid="ref26">26</xref>]. Prediction has also been used in the identification of early cancer diagnoses using image data analysis [<xref ref-type="bibr" rid="ref27">27</xref>]. Classification of patients for disease screening, a prediction task, can be performed with high accuracy using ML.</p>
        <p>Although the accuracy of a predictive algorithm is considered one of the most important virtues, interpretability [<xref ref-type="bibr" rid="ref28">28</xref>] is another important aspect to consider, especially in health science research. Interpretability often comes at the price of reduced accuracy, which is sometimes framed as the “interpretability-accuracy trade-off.” More complex models, which may improve prediction accuracy, maybe less interpretable, as it can be difficult to trace why the model arrived at such a decision, how the predictors relate to the outcome, and how to interpret the results. Interpretability generally is used to mean being able to understand the inner workings of a model, but as evidenced by the previous sentence, it can encompass several different aspects. These can range from overall model structure, ability to explain individual predictors, transparency of decision-making processes, and more. Measuring interpretability is a challenge, as it can be context-dependent for the problem you are working on; more information on interpretability can be found at [<xref ref-type="bibr" rid="ref29">29</xref>]. In the screen time prediction example above, interpretability is not of concern but rather maximizing the prediction accuracy, as it may not be of interest how the algorithm predicted the values, but rather the predicted values themselves.</p>
      </sec>
      <sec>
        <title>Estimation</title>
        <p>ML algorithms can also be used to estimate associations between exposures and health outcomes [<xref ref-type="bibr" rid="ref30">30</xref>]. Examples include calculating the odds ratio of obesity while comparing 2 socioeconomic statuses, measuring the association between physical activity and mortality [<xref ref-type="bibr" rid="ref31">31</xref>], and estimating the association between sociodemographic traits and diabetes prevalence [<xref ref-type="bibr" rid="ref32">32</xref>]. However, the estimation procedures of ML algorithms are often limited to point estimation and usually lack inferential abilities such as <italic>P</italic> values and Bayes factors. Meaning, estimation procedures can usually find an approximate value of a parameter (like an average) through point estimation but are not usually able to output other quantities such as CIs or hypothesis tests which provide information on the population as a whole. This is because models that are nonparametric or complex may not make certain distributional assumptions, which makes quantifying CIs for a point estimate not easily doable. For an investigator wanting to confirm the positive effects of a medical treatment on patient health outcomes, ML often cannot discern whether the estimated effect size is statistically significant or not. Rather, this can be done through classical statistical tests, which possess inferential capabilities. However, this limitation is not the same as generating CIs for model performance, which is a separate procedure and generally more straightforward as model evaluation may involve data splitting or repeated sampling.</p>
        <p>That being said, certain ML algorithms still have the potential for inferential capacity. Recently, a random forest-based framework for judging the statistical significance of heterogeneous treatment effects for individuals with specific covariate values has been developed [<xref ref-type="bibr" rid="ref33">33</xref>]. Additionally, many other algorithms, such as support vector machine (SVM) and <italic>k</italic>-nearest neighbors (<italic>k</italic>-NN), can output CIs and <italic>P</italic> values for estimated effects [<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref35">35</xref>]. However, these approaches are, in general, much less efficient than classical statistical tests and thus should be used after carefully considering the trade-off between flexibility (model specification) and efficiency (power of the test).</p>
      </sec>
      <sec>
        <title>Causal Inference</title>
        <p>Understanding causal associations is the activity of investigating the cause of an outcome, such as the occurrence of disease. In the statistical literature, it is known as causal inference, which provides a foundation for establishing causality [<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref37">37</xref>]. Research questions related to understanding causal associations include estimation of average or individual treatment effects (ATE and ITE, respectively) and identification of important risk factors or subgroups for a health outcome. A rich literature for causal inference methods has been developed in statistics. For example, when estimating average treatment effects [<xref ref-type="bibr" rid="ref38">38</xref>] from observational data, propensity score matching [<xref ref-type="bibr" rid="ref39">39</xref>] is frequently used, which is often done using flexible models such as random forests [<xref ref-type="bibr" rid="ref40">40</xref>]. However, its use should be carefully considered due to potential small sample size issues and covariate imbalance.</p>
      </sec>
      <sec>
        <title>Study Design Considerations</title>
        <p>Quality of data is a key design consideration for the successful use of ML. Given the complexity of ML, which often involves managing a vast range of input variables coming in various formats, it is crucial to plan the identification, collection, and management of these variables. Data from multiple sources—for example, clinical information, genomics data, and medical images have different dimensions—eventually needs to be aligned for downstream analyses using techniques such as feature concatenation, feature extraction, and tree and metric-based learning, so planning the process ahead of time is essential to consider any feasibility issues [<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref42">42</xref>].</p>
        <p>In ML studies, missing data are one of the most frequently observed issues that can harm the quality of data and can lead to bias. Thus, planning the data collection process to minimize missing data and setting up quality control checks on data entry errors is essential. Approaches to data missingness will be described in the Data Collection and Preprocessing section.</p>
      </sec>
      <sec>
        <title>Sample Size and Strategies for Sample Size Determination</title>
        <p>In general, ML models with tunable parameters require much larger sample sizes than traditional statistical models to achieve the same level of estimation or prediction accuracy. Since ML models usually have much weaker model assumptions than traditional parametric models, when the dimension of a parameter is much larger, more data are needed for the estimator to determine the model structure on top of estimating the mean outcome or the parameters of interest. The phenomenon when the required sample size grows exponentially with the dimension of the parameter is called the “curse of dimensionality,” which is attributable to the nonparametric nature of ML models.</p>
        <p>This relatively large sample size requirement is not the only issue, but precisely calibrating the required size is another challenge. Unlike traditional clinical trials, where the sample size of a study is planned to achieve a certain amount of power to detect a certain effect size [<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref44">44</xref>], the sample size determination for ML has a different meaning, and there is no generic framework for it [<xref ref-type="bibr" rid="ref45">45</xref>]. In ML, where the model performance is often measured in terms of prediction accuracy; measures, such as mean squared error and classification error rate, are meant to be controlled under a predefined level, and the sample size that meets such prediction accuracy is to be derived.</p>
        <p>Popular choices of evaluation metrics include mean squared error and <italic>R</italic><sup>2</sup> for continuous outcomes, Brier scores for survival outcomes, classification error rate (accuracy rate) for categorical outcomes, and area under the receiver operating characteristics curve (AUC) for binary outcomes. However, these evaluation metrics should be chosen after consideration of the cost of wrong predictions and the benefits of correct predictions. For example, a model for predicting cancer may have to impose a higher cost for false negative than for false positive. Thus, a true negative rate (TNR) or a partial AUC could be considered for its evaluation measure after considering threshold selection and other possible reporting metrics. There are no “best” evaluation metrics, as this is highly dependent on the problem itself beyond the characterization of a classification or regression framework; differences in metrics can emerge when there are outliers in the data set, model comparison, and differential penalties for errors.</p>
        <p>Although there is no deterministic sample size formula for predictive models, one can fit a learning curve on the training data for a given ML algorithm based on some evaluation measures such as the prediction error rate and AUC, which quantifies the overall accuracy of a binary classification model [<xref ref-type="bibr" rid="ref45">45</xref>]. Essentially, the researcher is required to run the ML algorithm for the pilot data using training data and project the evaluation measure based on the fitted learning curve through the evaluation of the testing data. This evaluation measure is then used to inform the sample size or amount of data needed for the specific accuracy or statistical power desired [<xref ref-type="bibr" rid="ref46">46</xref>].</p>
        <p>To accurately estimate this curve, at least 2 or 3 points are required [<xref ref-type="bibr" rid="ref47">47</xref>]. This means that the researcher is required to take at least 2 subsets of the available data and calculate 2 respective error rates. However, the pilot data might not capture all the biases present in the larger data set, as the sample may not be fully representative of the population or phenomena of interest. The researcher must be wary of generalizations using this pilot data. It is therefore recommended that a statistician trained in ML be present to assist with these technical sample size estimation procedures.</p>
        <p>More details are included in section A of <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> [<xref ref-type="bibr" rid="ref9">9</xref>-<xref ref-type="bibr" rid="ref21">21</xref>], which also includes information on how to mitigate the large sample requirement in neural networks through augmentation techniques and transfer learning (defined in the section Advanced Concepts).</p>
      </sec>
      <sec>
        <title>Data Collection and Data Preprocessing</title>
        <p>As previously mentioned, EHR, administrative claims, clinical trials, and longitudinal cohort data are major data types in the ML world. However, there are also “specialized data types,” which require their own distinct methods of analysis due to their unique qualities. These include textual or language data, imaging, and genomics, and will be discussed in the Applications section. Due to the highly complex nature of the data being used, ML analyses often involve heavy data preprocessing. This step often requires more time than the main analysis itself and not only includes screening for erratic values, detecting and understanding outliers, and handling of missing values, but also transformation of the data into a software-friendly format, feature scaling, feature selection, dimensionality reduction, and sample splitting for validation, among others [<xref ref-type="bibr" rid="ref48">48</xref>].</p>
        <p>These procedures, while seemingly not important, may bring significant changes to the conclusion. For example, data preprocessing is an essential step for categorical features when using certain gradient boosting algorithms such as XGBoost, as the algorithm requires the categorical variables to be coded through mean coding or one hot coding before use in the model. Additionally, feature scaling would change the results of any methods involving Euclidean distance metrics such as principal component analysis (PCA), <italic>k</italic>-means, and <italic>k</italic>-NN.</p>
        <p>As mentioned in the section Refining Research Questions: What Can Machine Learning Do? ML can be used as an auxiliary tool for missing data imputation [<xref ref-type="bibr" rid="ref49">49</xref>], dimensionality reduction [<xref ref-type="bibr" rid="ref50">50</xref>] before regression analysis, and variable selection, all of which can make an analysis more manageable.</p>
        <p>Missing data, which typically arises in survival analysis, longitudinal studies, among other scientific studies, has great potential to create statistical bias if not accounted for in an auxiliary analysis [<xref ref-type="bibr" rid="ref51">51</xref>]. Simply discarding observations with missing data may lead to selection bias and reduced sample size, resulting in incorrect estimation of relationships. Instead, the mechanism behind the missing data can be accounted for through an auxiliary analysis to mitigate the effects of the bias using tools such as imputation and maximum likelihood estimation. See, for example, “missForest” for imputation based on random forests [<xref ref-type="bibr" rid="ref52">52</xref>]. As an example, [<xref ref-type="bibr" rid="ref49">49</xref>] provides a real-use case of how ML methods can be used to impute missing data in a breast cancer problem.</p>
      </sec>
      <sec>
        <title>Algorithm and Model Selection</title>
        <p>The choice of an ML method largely depends on the type of task and data type. For example, linear discriminant analysis (LDA) and <italic>k</italic>-means clustering can only be used with continuous predictors; SVM and support vector regression can be used for classification and regression problems, respectively; and random forests and neural networks are capable of both classification and regression. <xref ref-type="table" rid="table1">Table 1</xref> lists commonly available algorithms in each category and summarizes their benefits and drawbacks.</p>
        <p>Once the candidate algorithms are identified, the choice of the algorithm may be driven by the scientific inquiry, as discussed in the section Refining Research Questions: What Can Machine Learning Do? Additional factors for algorithm choice may include computing resources, data limitations, and data assumptions. <xref rid="figure2" ref-type="fig">Figure 2</xref> gives a list of common ML algorithms and the purposes they may be used for. The nature of the scientific study will determine the importance of interpretability in the prediction of particular phenomena. A “black box” predictive model may not clearly explain why such predictions were made, only what the predictions are [<xref ref-type="bibr" rid="ref53">53</xref>]. For clinicians who want to attribute a specific cause of an output, these methods may be less suited for their research question, and it is suggested to use a more interpretable model. As an extreme example, consider using an ML algorithm to support the decision of no amputation, minor amputation, or major amputation for a patient with diabetic foot ulcer. One can imagine that an interpretable ML algorithm must be preferred, as was proposed in [<xref ref-type="bibr" rid="ref54">54</xref>], as the decision-making process needs to be clear before an amputation is carried out.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Benefits and drawbacks of common machine learning methods in supervised and unsupervised settings. This list is not exhaustive and includes popular machine-learning algorithms in each category.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="170"/>
            <col width="0"/>
            <col width="350"/>
            <col width="0"/>
            <col width="450"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Methods</td>
                <td colspan="2">Strengths</td>
                <td>Limitations</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="6">
                  <bold>Benefits and drawbacks of some supervised methods</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Logistic regression and linear regression</td>
                <td colspan="2">
                  <list list-type="bullet">
                    <list-item>
                      <p>Interpretable</p>
                    </list-item>
                    <list-item>
                      <p>Easy implementation</p>
                    </list-item>
                  </list>
                </td>
                <td colspan="2">
                  <list list-type="bullet">
                    <list-item>
                      <p>Overfitting with highly correlated data (use variable selection or shrinkage methods)</p>
                    </list-item>
                    <list-item>
                      <p>Poor performance for nonlinearly separable data</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Naive Bayes</td>
                <td colspan="2">
                  <list list-type="bullet">
                    <list-item>
                      <p>Performs well even without conditional independence</p>
                    </list-item>
                    <list-item>
                      <p>Easy implementation</p>
                    </list-item>
                  </list>
                </td>
                <td colspan="2">
                  <list list-type="bullet">
                    <list-item>
                      <p>Simple; outperformed by well-tuned, more complex models</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td><italic>k</italic>-nearest neighbors</td>
                <td colspan="2">
                  <list list-type="bullet">
                    <list-item>
                      <p>Nonparametric (no model assumptions needed)</p>
                    </list-item>
                    <list-item>
                      <p>High level of flexibility; performs well for nonlinear boundaries</p>
                    </list-item>
                  </list>
                </td>
                <td colspan="2">
                  <list list-type="bullet">
                    <list-item>
                      <p>Low interpretability</p>
                    </list-item>
                    <list-item>
                      <p>Poor performance for high-dimensional data</p>
                    </list-item>
                    <list-item>
                      <p>Difficulty dealing with missing values</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Support vector machine</td>
                <td colspan="2">
                  <list list-type="bullet">
                    <list-item>
                      <p>Performs well with high-dimensional data and nonlinear boundaries</p>
                    </list-item>
                  </list>
                </td>
                <td colspan="2">
                  <list list-type="bullet">
                    <list-item>
                      <p>Low interpretability</p>
                    </list-item>
                    <list-item>
                      <p>Poor performance for imbalanced data</p>
                    </list-item>
                    <list-item>
                      <p>Usually outperformed by newer methods</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Decision trees</td>
                <td colspan="2">
                  <list list-type="bullet">
                    <list-item>
                      <p>Interpretable for trivial data sets</p>
                    </list-item>
                    <list-item>
                      <p>Nonparametric (no model assumptions needed)</p>
                    </list-item>
                    <list-item>
                      <p>Works with nonlinear relationships</p>
                    </list-item>
                    <list-item>
                      <p>Classification for more than 2 classes</p>
                    </list-item>
                  </list>
                </td>
                <td colspan="2">
                  <list list-type="bullet">
                    <list-item>
                      <p>Prone to overfitting</p>
                    </list-item>
                    <list-item>
                      <p>Difficult to interpret for nontrivial data sets</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Random forest</td>
                <td colspan="2">
                  <list list-type="bullet">
                    <list-item>
                      <p>Handles high-dimensional data well</p>
                    </list-item>
                    <list-item>
                      <p>Reduces overfitting from decision trees</p>
                    </list-item>
                    <list-item>
                      <p>Reduces variance</p>
                    </list-item>
                  </list>
                </td>
                <td colspan="2">
                  <list list-type="bullet">
                    <list-item>
                      <p>Low interpretability</p>
                    </list-item>
                    <list-item>
                      <p>Poor performance for sparse data</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Gradient boosted trees</td>
                <td colspan="2">
                  <list list-type="bullet">
                    <list-item>
                      <p>Increased accuracy over random forests</p>
                    </list-item>
                  </list>
                </td>
                <td colspan="2">
                  <list list-type="bullet">
                    <list-item>
                      <p>More difficult to implement due to tuning parameter selection</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Artificial neural networks</td>
                <td colspan="2">
                  <list list-type="bullet">
                    <list-item>
                      <p>Works well with many data types (images, text, audio, etc)</p>
                    </list-item>
                    <list-item>
                      <p>Adaptable architecture</p>
                    </list-item>
                  </list>
                </td>
                <td colspan="2">
                  <list list-type="bullet">
                    <list-item>
                      <p>Low interpretability</p>
                    </list-item>
                    <list-item>
                      <p>Overfitting if trained too long</p>
                    </list-item>
                    <list-item>
                      <p>Requires a great deal of data</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td colspan="6">
                  <bold>Benefits and drawbacks of some unsupervised methods</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td><italic>k</italic>-means clustering</td>
                <td colspan="2">
                  <list list-type="bullet">
                    <list-item>
                      <p>Fast, easy implementation</p>
                    </list-item>
                  </list>
                </td>
                <td colspan="2">
                  <list list-type="bullet">
                    <list-item>
                      <p>Only quantitative data</p>
                    </list-item>
                    <list-item>
                      <p>No clear best way to choose k</p>
                    </list-item>
                    <list-item>
                      <p>Poor performance for noncircular cluster</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Hierarchical cluster</td>
                <td colspan="2">
                  <list list-type="bullet">
                    <list-item>
                      <p>Reproducible</p>
                    </list-item>
                    <list-item>
                      <p>Visually interpretable by dendrograms</p>
                    </list-item>
                    <list-item>
                      <p>Cluster shape not assumed to be globular</p>
                    </list-item>
                  </list>
                </td>
                <td colspan="2">
                  <list list-type="bullet">
                    <list-item>
                      <p>Poor performance on high-dimensional data</p>
                    </list-item>
                    <list-item>
                      <p>Hierarchy level must be selected</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Gaussian mixture models</td>
                <td colspan="2">
                  <list list-type="bullet">
                    <list-item>
                      <p>Flexibility since clusters can have irregular shapes</p>
                    </list-item>
                    <list-item>
                      <p>No assumption of cluster number or level</p>
                    </list-item>
                    <list-item>
                      <p>Accommodates mixed cluster membership</p>
                    </list-item>
                  </list>
                </td>
                <td colspan="2">
                  <list list-type="bullet">
                    <list-item>
                      <p>Poor performance on high-dimensional data</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Linear discriminant analysis</td>
                <td colspan="2">
                  <list list-type="bullet">
                    <list-item>
                      <p>Interpretable</p>
                    </list-item>
                    <list-item>
                      <p>Can lower model variance over logistic regression if model assumptions are met</p>
                    </list-item>
                  </list>
                </td>
                <td colspan="2">
                  <list list-type="bullet">
                    <list-item>
                      <p>Can only be used with continuous predictors</p>
                    </list-item>
                    <list-item>
                      <p>Poor performance for nonlinearly separable data (try quadratic discriminant analysis)</p>
                    </list-item>
                  </list>
                </td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Commonly used algorithms in the supervised setting by algorithm type distinguished between classification and regression problems, as well as methods used in unsupervised learning.</p>
          </caption>
          <graphic xlink:href="jmir_v26i1e50890_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>Being too open-ended about model possibilities may lead to nonreproducibility or phenomena analogous to <italic>P</italic>-hacking, where researchers may choose the model that leads to the highest accuracy for the data at hand after trials of multiple approaches. This highlights the importance of having a held-out test set, which is used only at the end of model development to report model performance results, as well as having an appropriate justification for model selection. More details about a held-out test set can be found in the Hyperparameter and Model Validation section. It is important to be specific enough about the goals of the analysis to justify the use of different algorithms. At the same time, being too specific can put too many undesired constraints on research, unduly limiting the use of adequate algorithms and models [<xref ref-type="bibr" rid="ref55">55</xref>].</p>
      </sec>
      <sec>
        <title>Hyperparameter Tuning and Model Validation</title>
        <p>Assuming an appropriate model has been chosen, hyperparameter tuning and model validation become the next steps for an ML practitioner. In section B of <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> [<xref ref-type="bibr" rid="ref9">9</xref>-<xref ref-type="bibr" rid="ref21">21</xref>], we provide guidelines for tuning hyperparameters for 2 popular ML methods—tree-based methods and neural networks. The relatively high performance of these models is achieved by adequately tuning the hyperparameters.</p>
        <p>Model performance assessment metrics are used to determine how well a trained model performs on new, unseen data. Popular model assessment metrics include in regression: <italic>R</italic><sup>2</sup> values, mean absolute error, mean square error, and in classification: recall, <italic>F</italic><sub>1</sub>-score, and AUC. Beyond these metrics, aspects of model performance can also include ease of use and deployment feasibility. In many health care cases, understanding how a model reached the conclusion as well as interpreting the results of the conclusion may be preferred over blackbox models, as medical decisions are made based on the results of the model. The model deployment aspect focuses on its practical use; a complicated model may not be used in resource-constrained settings, so its use may not be feasible.</p>
        <p>Typically, the preprocessed data are split into separate training and testing sets. The term “validation set” is often used interchangeably with the term “test set” and usually refers to a portion of the data that are not used in training the model. The model is evaluated on the test set to give an unbiased estimate of model performance on unseen data. This test set cannot be touched before model fitting and is not used for training the model or tuning model parameters.</p>
        <p>In some literature, the training data themselves may also be split into 2 separate data sets: one, dubbed the “training set,” is used to train the models to get parameter estimates, and the other, the “validation set,” is used to help tune parameters. Therefore, rather than a split into a training and testing set as previously mentioned, we have a training, validation, and testing split, where the test set is held out until model performance evaluation. The interchangeable use of “test set” and “validation set” in this case may be confusing, as they do not refer to the same thing when data are portioned this way—one must be careful in reading to understand which scenario is occurring.</p>
        <p>When partitioning data, it is important for the test set to be representative of the data rather than having different characteristics than the training set. There are various factors to consider when forming a test set, which can depend on the use case. For example, one may want the training and test sets to contain records from different individuals for diagnosis purposes, or for the training and test sets to contain observations from different time points on the same individuals for prognosis. Saeb et al [<xref ref-type="bibr" rid="ref56">56</xref>] discuss examples of using different types of splitting in cross-validation and how results can differ based on the partitioning.</p>
        <p>Section B of <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> [<xref ref-type="bibr" rid="ref9">9</xref>-<xref ref-type="bibr" rid="ref21">21</xref>] continues to discuss how to validate these models using <italic>k</italic>-fold cross-validation, which is a validation method that uses a given sample, assuming collecting additional data is difficult. For high-dimensional data where <italic>k</italic>-fold cross-validation is infeasible to implement due to computational costs, an alternative approach is introduced. It should be noted that cross-validation methods still require a held-out test set to evaluate model performance at the very end; <italic>k</italic>-fold cross-validation is used on the training data set to tune the parameters, but it does not replace the need for a separate testing set. An introduction to how ML models are trained is also discussed in section C of <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> [<xref ref-type="bibr" rid="ref9">9</xref>-<xref ref-type="bibr" rid="ref21">21</xref>] for additional information and completion in the understanding of model training.</p>
      </sec>
    </sec>
    <sec>
      <title>Results and Reproducibility</title>
      <p>The final step of any project is to report the results. Luo and colleagues [<xref ref-type="bibr" rid="ref57">57</xref>] set up reporting standards of ML predictive model-based research for biomedical researchers, which include a list of reporting items to be included. Reporting of such items is essential to promoting reproducibility in research. Among the items are details including the nature of the study along with a background, objectives, clinical rationale, data sources, type of modeling, inclusion and exclusion criteria, time span, model validation strategies, handling of missing values, cleaning and transformation, candidate modeling techniques with justification, model selection criteria, clinical implications, and model limitations [<xref ref-type="bibr" rid="ref57">57</xref>].</p>
      <p>Several of these reporting items have been discussed in the paper and fall under the outlined categories of research question refinement, study design considerations, data collection and preprocessing, algorithm and model selection, hyperparameter tuning, and model validation. The goal of the list of reporting standards for predictive modeling is to encourage transparency and reproducibility to ensure credibility in the scientific community and the methodological soundness of research.</p>
      <p>The need for transparent reporting is even more apparent when considering the nuances of ML. While studies involving ML have experimental design steps that overlap with general study considerations such as refining a research question, study design, and data collection, the use of ML in health science studies requires ML-specific considerations in terms of quality and size of data, adequacy of methods, and reproducibility. These issues are inherent in ML-involved research owing to both the complexity of data and ML models and a wide spectrum of ML methods. Readers are encouraged to read the literature [<xref ref-type="bibr" rid="ref58">58</xref>-<xref ref-type="bibr" rid="ref60">60</xref>] for guidelines on general study considerations. Therefore, there is a necessity for conscientious approaches to reporting.</p>
      <p>Within each ML method, there are usually one or more hyperparameters, such as the depth and node size in tree methods and the penalty term in kernel regression [<xref ref-type="bibr" rid="ref61">61</xref>]. Cherry-picking a hyperparameter after looking at the data multiple times may result in irreproducibility. This is why the held-out test set can only be used for result reporting and should not be used for further model development. As previously mentioned, for the sake of reproducibility, keeping documentation of the research pipeline from start to finish as outlined is also necessary.</p>
    </sec>
    <sec>
      <title>Application</title>
      <p>This section includes specialized data types in ML.</p>
      <sec>
        <title>Natural Language Processing</title>
        <p>Medical notes of physicians may contain important information beyond quantitative clinical records. They, however, are not readily analyzable without processing such as transcription and topic extraction. Natural language processing (NLP) does what was previously considered impossible by processing such nonstandard form of massive data into a readily analyzable format, opening huge opportunities for health science research.</p>
        <p>NLP as a field has undergone a revolution since 2018. The seminal paper, “BERT” [<xref ref-type="bibr" rid="ref62">62</xref>], delivered unprecedented performance on almost every major language task. NLP models using transformers (defined in the section Advanced Concepts), such as BERT and GPT [<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref64">64</xref>], can be used for various language tasks, including classification, summarization, imputation, and prediction. The most common and useful tasks in medical NLP usually deal with hospital documents and patient interactions. For instance, NLP models can be used to automatically transcribe patient conversations, predict disease from medical notes, or impute missing values in medical forms [<xref ref-type="bibr" rid="ref65">65</xref>]. There are many high-quality models trained on massive text corpora that can, out of the box, deliver state-of-the-art performance on almost any task.</p>
        <p>Therefore, the first step in any NLP project is to select a pretrained model closest to the language domain being used and perform transfer learning. Transfer learning is where a model pretrained on 1 task is then trained on a related but different task. For example, for medical tasks, “Med-BERT: pretrained contextualized embeddings on large-scale structured EHR for disease prediction” and “SciBERT: a pretrained language model for scientific text” may be of use, as they are trained on similar language as is used in medical contexts [<xref ref-type="bibr" rid="ref60">60</xref>,<xref ref-type="bibr" rid="ref61">61</xref>,<xref ref-type="bibr" rid="ref66">66</xref>]. The original BERT model will also work well for most purposes. The common structure of language and the size of most of these training data sets (terabytes for some models) mean that a general model will have almost certainly been exposed to any sort of text problem a researcher may be interested in due to the sheer breadth of data.</p>
        <p>The next step is to preprocess the data so that text is converted into simple numeric tokens that can be used as inputs and process those tokens into small sets for the model to interpret. Once this is done, the model can be fine-tuned on the new data. This is done by taking the previously selected pretrained model and carefully training it with a low learning rate on the new data. Once this is done, the model should be ready for use. Extreme care needs to be taken to derive an optimal train and test split.</p>
      </sec>
      <sec>
        <title>Imaging</title>
        <p>Imaging research has long been the most high-profile ML task. High-quality benchmark data sets such as the ImageNet challenge have provided robust methods for model assessment with useful pretrained networks for transfer learning [<xref ref-type="bibr" rid="ref67">67</xref>,<xref ref-type="bibr" rid="ref68">68</xref>]. The uses of imaging in biomedical applications are myriad. Diagnostics, such as automatic reading and classification of radiological scans or tissue biopsies, are an active area of research. Computer-assisted decision support, where ML algorithms mark anomalous areas for clinicians to investigate, is also relatively well developed. Each use case often requires highly specific knowledge and training data; we leave the specifics to clinical experts.</p>
        <p>Convolutional neural networks are a type of deep learning model heavily used in image analyses, such as medical imaging. Convolutional neural networks can extract patterns from image pixels and are thus widely used in abnormality detection, segmentation, and classification [<xref ref-type="bibr" rid="ref69">69</xref>].</p>
        <p>For imaging, as with language, it is strongly encouraged to take advantage of transfer learning. High-quality models are available on many tasks. In addition, vision has demonstrated similar properties as language, and seemingly unconnected tasks often turn out to be very similar, such as categorizing pastries and segmenting tumors. Even if the images in question are very different sizes, it can still be effective to simply resize them to fit the network in question. As in all things, the best strategy is simply to experiment [<xref ref-type="bibr" rid="ref70">70</xref>].</p>
      </sec>
      <sec>
        <title>Genomics</title>
        <p>With its high-dimensional nature and the growing availability of large-scale data, genomics has become one of the largest research areas where ML is used [<xref ref-type="bibr" rid="ref71">71</xref>]. The capacity of traditional statistics is often limited without the support of ML, especially in “multi-omics,” where multiple modes of genomics data, such as DNA-seq, RNA-seq, ChIP-seq, proteomics, and metagenomics, are analyzed together.</p>
        <p>ML is used in genomics in multiple ways. For example, ML can be used to predict a certain gene’s expression level given the corresponding DNA-seq information. Genome-wide association studies (GWAS) that aim to identify genetic variants associated with a medical condition of interest, frequently involve ML algorithms such as neural networks and random forests [<xref ref-type="bibr" rid="ref72">72</xref>]. Zou et al [<xref ref-type="bibr" rid="ref73">73</xref>] provide more examples of deep learning applications to genomics.</p>
        <p>The usefulness of ML as an auxiliary tool should not be underestimated. The overwhelming number of genes is often screened using the variable importance of random forests before downstream analyses. High-dimensional features can be reduced using autoencoders [<xref ref-type="bibr" rid="ref74">74</xref>,<xref ref-type="bibr" rid="ref75">75</xref>] to lower-resolution data, which can then be analyzed using traditional statistical analysis tools. Graphical illustrations of the data can also be created through 2D or 3D summaries using algorithms such as tSNE and PCoA [<xref ref-type="bibr" rid="ref76">76</xref>,<xref ref-type="bibr" rid="ref77">77</xref>].</p>
        <p>Despite its broad capacity in genomics research and ability to handle high-dimensional data, ML has limitations. In genomics data, the number of features outnumbering the sample size, or high dimensionality, is a commonly seen attribute; even with the use of ML, the relatively small sample size can cause reliability and reproducibility issues.</p>
      </sec>
      <sec>
        <title>Precision Medicine</title>
        <p>As previously mentioned, the goal of the research question of interest may be to indirectly support clinical decision-making. RL is a subset of ML that explicitly provides recommendations for decision-making at sequential time points. PM is a field where such algorithms can be applied to make treatment recommendations for individuals according to their unique characteristics.</p>
        <p>PM starts from patient heterogeneity, where reactions to treatment vary from patient to patient [<xref ref-type="bibr" rid="ref78">78</xref>]. For many illnesses, no panacea exists. PM seeks to recommend different treatment options for unique individuals based on their characteristics; this is formally called individualized treatment rules (ITRs) [<xref ref-type="bibr" rid="ref79">79</xref>,<xref ref-type="bibr" rid="ref80">80</xref>]. ITR forms the basis of PM by providing the best treatment recommendations tailored for each patient, as treatment effects can be heterogeneous among individuals. These rules are best identified with rich information about patients such as sociodemographic, clinical, and genomic data. Recently, a wealth of ITR methods have been developed [<xref ref-type="bibr" rid="ref79">79</xref>-<xref ref-type="bibr" rid="ref82">82</xref>].</p>
        <p>Health care professionals and clinicians are often faced with treating a patient multiple times based on changes in response. For example, researchers can plan adaptive intervention programs for weight loss where later interventions are adjusted depending on responses to the previous treatment [<xref ref-type="bibr" rid="ref83">83</xref>]. Such dynamic strategies are called dynamic treatment regimes (DTRs) [<xref ref-type="bibr" rid="ref84">84</xref>,<xref ref-type="bibr" rid="ref85">85</xref>]. DTRs aim to provide tailored decisions over more than 1 time point based on subject characteristics and their evolving contexts so that a long-term outcome of interest is optimized. The literature on this subtopic is fast-growing [<xref ref-type="bibr" rid="ref86">86</xref>-<xref ref-type="bibr" rid="ref88">88</xref>].</p>
        <p>For example, patients with cancer may be given frontline chemotherapy followed by a salvage treatment if the response to the initial treatment is not successful [<xref ref-type="bibr" rid="ref89">89</xref>]. A DTR can then be used to account for potential changes in a patient so that optimal recommendations can be made for each patient for unique stages in their disease to optimize a long-term outcome of interest, such as patient survival. An estimation of such DTR may require a large sample size. To address this issue, investigators can design a multistage randomized trial in an adaptive way through a sequential multiple assignment randomized trial (SMART) [<xref ref-type="bibr" rid="ref83">83</xref>,<xref ref-type="bibr" rid="ref90">90</xref>]. For instance, if a patient responded well to the first treatment, increasing the dose may not be particularly effective, and assigning a continued or decreased dose would be worth exploring. ITR and DTR are decision-support tools that provide the best treatment recommendations for patients.</p>
        <p>SMARTs are an adaptive study design approach to finding a DTR. While SMARTs are used only for a fixed number of time points, the number of decision time points could be arbitrarily large for some problems. This is formally called an infinite-horizon setting. For example, artificial pancreas programs decide the amount of insulin infused every minute, so that numerous actions are taken even during a day [<xref ref-type="bibr" rid="ref91">91</xref>]. A class of DTRs that provide essentially continuous recommendations is called just-in-time adaptive intervention [<xref ref-type="bibr" rid="ref92">92</xref>]. A Markov decision process (MDP) is often used for these problems. MDP is a class of dynamic decision rules that base their decision only on the current state information, not necessarily depending on the history of the change. V-learning [<xref ref-type="bibr" rid="ref93">93</xref>] is an example of such an infinite-horizon DTR that uses MDP structure.</p>
        <p>PM has a strong connection with ML. Treatment effects are often dictated by thousands of patient characteristics, such as sociodemographic, genetic, clinical, and behavioral factors. Genetic factors alone are high-dimensional and can contain millions of traits. The goal of PM is to recommend the best treatment for a patient given their unique characteristics by providing them with an ITR. For example, a clinician may be interested in delineating an optimal ITR for each patient that best achieves cancer remission [<xref ref-type="bibr" rid="ref94">94</xref>].</p>
      </sec>
    </sec>
    <sec>
      <title>Limitations and Optimizations</title>
      <p>ML models trained on data that inaccurately represent the population cause fundamental issues such as biased prediction and suboptimality of decisions. Data, where the healthy population is poorly represented, may not be used to make a conclusion for the general population without adjustment. As ML can be used to support decision-making processes, it is also crucial that these decisions arising from the data are not discriminatory toward certain populations [<xref ref-type="bibr" rid="ref95">95</xref>]. In the ML world, this term is called fairness. When the underlying data are biased, the ML algorithms that are trained on such data may produce biased results, which can lead to inaccurate predictions or withholding of resources. Bias in data may result from measurement bias, representation bias, and sampling bias, among others [<xref ref-type="bibr" rid="ref96">96</xref>,<xref ref-type="bibr" rid="ref97">97</xref>]. As an example, unbalanced gender data in the medical imaging field has led to algorithmic underperformance [<xref ref-type="bibr" rid="ref98">98</xref>]. This discussion should be considered in the data quality assessment when planning data collection.</p>
    </sec>
    <sec>
      <title>Advanced Concepts</title>
      <sec>
        <title>Transformers</title>
        <p>Transformers in the context of NLP are a type of deep learning model architecture that was first introduced by Vaswani in 2017 [<xref ref-type="bibr" rid="ref63">63</xref>] and have outperformed other model types such as neural networks in both language generation and language interpretation [<xref ref-type="bibr" rid="ref99">99</xref>]. Transformer models have a unique self-attention mechanism where the model can weigh the importance of different pieces of input data.</p>
      </sec>
      <sec>
        <title>Transfer Learning</title>
        <p>Transfer learning is the process of taking knowledge from one task and applying it to a different task. This can be useful in several scenarios, such as when training data for models can be difficult to collect or it is computationally expensive to train a new model. In such cases, a pretrained model used in one task can then be trained using data from a different but related task, and the information learned from the previous task can be useful in the new task. This can have reduced data requirements and improved performance as opposed to training a brand-new model, especially when using large, pretrained, publicly available models [<xref ref-type="bibr" rid="ref100">100</xref>].</p>
      </sec>
      <sec>
        <title>Reinforcement Learning</title>
        <p>RL is a type of ML focused on training an algorithm to make sequential decisions in potentially changing environments to maximize a cumulative reward [<xref ref-type="bibr" rid="ref101">101</xref>]. An agent, or decision maker, will receive some quantification of the current environment, also known as the state; the agent will then take an action that will change the state of the environment. The value associated with taking the action and transitioning to the next state is quantified by a “reward”; the agent should choose actions to maximize long-term reward. The goal may be to find the optimal sequence of actions to take to maximize the long-term reward. An application of this is decision support, which has previously been discussed. Other applications of RL range from PM to the development of self-driving cars to financial trading to the creation of ChatGPT. Those interested in the applications of RL in health care should see reference [<xref ref-type="bibr" rid="ref102">102</xref>] for examples of use and [<xref ref-type="bibr" rid="ref103">103</xref>] for guidelines of use.</p>
      </sec>
    </sec>
    <sec>
      <title>Outlook</title>
      <p>The field of ML has a vast trove of tools and resources for use. Its potential, though impressive and exciting, can also be a drawback, as the inherent flexibility in the analysis process gives room for the researcher to arbitrarily or questionably choose methods that result in overfitting and false discovery. This paper has provided a framework for steps involved in using ML in research, discusses analyses for specialized data formats, reviews decision support and bias in ML, and introduces PM, a popular field in the health research domain. Consulting ML experts throughout the process will not only streamline the analysis but also play a large role in legitimizing justifications for choice selections.</p>
      <p>Furthermore, the paper has highlighted the importance of preplanned documentation to ensure transparency and foster credibility within the scientific community. The incorporation of concrete examples within the health care domain, in addition to the provision of techniques involved in specialized data types, illustrates the vast applications of ML methodologies and their potential impact in the health science field.</p>
      <p>Overall, the specifics of different data types and the wide variety of research goals make it difficult to make more specific recommendation guidelines. However, major ML considerations and how to approach them are discussed, with specific examples. While this paper provides a general recommended research framework and major considerations for the use of ML, it is not comprehensive, as the aim was to provide a general overview of potential methods and considerations.</p>
      <p>While ML has strong performance potential in a variety of situations, its use needs to be carefully planned through the aforementioned steps and justified to obtain the best results, as ML cannot overcome poor study design or data quality despite all its virtues. By acknowledging these limitations, the research community can better strive for high-quality data and reproducible results to continue driving innovation in society.</p>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Supplementary information on general sample size calculations, model training, and model tuning and validation.</p>
        <media xlink:href="jmir_v26i1e50890_app1.docx" xlink:title="DOCX File , 34 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AI</term>
          <def>
            <p>artificial intelligence</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">ATE</term>
          <def>
            <p>average treatment effects</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">AUC</term>
          <def>
            <p>area under the receiver operating characteristics curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">DTR</term>
          <def>
            <p>dynamic treatment regime</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">EHR</term>
          <def>
            <p>electronic health record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">GWAS</term>
          <def>
            <p>genome-wide association studies</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">ITE</term>
          <def>
            <p>individual treatment effects</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">ITR</term>
          <def>
            <p>individualized treatment rule</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">k-NN</term>
          <def>
            <p>k-nearest neighbors</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">LDA</term>
          <def>
            <p>linear discriminant analysis</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">MDP</term>
          <def>
            <p>Markov decision process</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">ML</term>
          <def>
            <p>machine learning</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb13">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb14">PCA</term>
          <def>
            <p>principal component analysis</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb15">PM</term>
          <def>
            <p>precision medicine</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb16">RL</term>
          <def>
            <p>reinforcement learning</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb17">SMART</term>
          <def>
            <p>sequential multiple assignment randomized trial</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb18">SVM</term>
          <def>
            <p>support vector machine</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb19">TNR</term>
          <def>
            <p>true negative rate</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>JS, DDM, HE, and MRK were supported in part by the National Center for Advancing Translational Sciences, National Institutes of Health (grant UL1TR002489).</p>
      <p>ARK is supported by the National Center for Advancing Translational Sciences, National Institutes of Health (grant KL2TR002490). The content is solely the responsibility of the authors and does not necessarily represent the official views of the National Institutes of Health. ARK also reports receiving research grants from the Diabetes Research Connection and the American Diabetes Association and a prize from the National Academy of Medicine outside the submitted work.</p>
      <p>AVV is supported by the National Institutes of Health T32 grant for the UNC Kidney Center.</p>
      <p>ELB is supported by the National Institutes of Health (grant K23DK127157).</p>
    </ack>
    <notes>
      <sec>
        <title>Data Availability</title>
        <p>Data sharing is not applicable to this article as no data sets were generated or analyzed during this study.</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="con">
        <p>HC, JS, DDM, HE, and MRK were responsible for paper concept and design. HC, JS, DDM, and HE contributed to the drafting of the manuscript. AVV and MRK are joint senior authors. All authors were involved in the critical revision of the manuscript.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jordan</surname>
              <given-names>MI</given-names>
            </name>
            <name name-style="western">
              <surname>Mitchell</surname>
              <given-names>TM</given-names>
            </name>
          </person-group>
          <article-title>Machine learning: trends, perspectives, and prospects</article-title>
          <source>Science</source>
          <year>2015</year>
          <volume>349</volume>
          <issue>6245</issue>
          <fpage>255</fpage>
          <lpage>260</lpage>
          <pub-id pub-id-type="doi">10.1126/science.aaa8415</pub-id>
          <pub-id pub-id-type="medline">26185243</pub-id>
          <pub-id pub-id-type="pii">349/6245/255</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Obermeyer</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Emanuel</surname>
              <given-names>EJ</given-names>
            </name>
          </person-group>
          <article-title>Predicting the future—big data, machine learning, and clinical medicine</article-title>
          <source>N Engl J Med</source>
          <year>2016</year>
          <volume>375</volume>
          <issue>13</issue>
          <fpage>1216</fpage>
          <lpage>1219</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/27682033"/>
          </comment>
          <pub-id pub-id-type="doi">10.1056/NEJMp1606181</pub-id>
          <pub-id pub-id-type="medline">27682033</pub-id>
          <pub-id pub-id-type="pmcid">PMC5070532</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Beam</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Kohane</surname>
              <given-names>IS</given-names>
            </name>
          </person-group>
          <article-title>Big data and machine learning in health care</article-title>
          <source>JAMA</source>
          <year>2018</year>
          <volume>319</volume>
          <issue>13</issue>
          <fpage>1317</fpage>
          <lpage>1318</lpage>
          <pub-id pub-id-type="doi">10.1001/jama.2017.18391</pub-id>
          <pub-id pub-id-type="medline">29532063</pub-id>
          <pub-id pub-id-type="pii">2675024</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wiens</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Saria</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sendak</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ghassemi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>VX</given-names>
            </name>
            <name name-style="western">
              <surname>Doshi-Velez</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Jung</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Heller</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kale</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Saeed</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ossorio</surname>
              <given-names>PN</given-names>
            </name>
            <name name-style="western">
              <surname>Thadaney-Israni</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Goldenberg</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Do no harm: a roadmap for responsible machine learning for health care</article-title>
          <source>Nat Med</source>
          <year>2019</year>
          <volume>25</volume>
          <issue>9</issue>
          <fpage>1337</fpage>
          <lpage>1340</lpage>
          <pub-id pub-id-type="doi">10.1038/s41591-019-0548-6</pub-id>
          <pub-id pub-id-type="medline">31427808</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41591-019-0548-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Greely</surname>
              <given-names>HT</given-names>
            </name>
          </person-group>
          <article-title>The uneasy ethical and legal underpinnings of large-scale genomic biobanks</article-title>
          <source>Annu Rev Genomics Hum Genet</source>
          <year>2007</year>
          <volume>8</volume>
          <fpage>343</fpage>
          <lpage>364</lpage>
          <pub-id pub-id-type="doi">10.1146/annurev.genom.7.080505.115721</pub-id>
          <pub-id pub-id-type="medline">17550341</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tryka</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Hao</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Sturcke</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Jin</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>ZY</given-names>
            </name>
            <name name-style="western">
              <surname>Ziyabari</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Popova</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Sharopova</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Kimura</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Feolo</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>NCBI's Database of Genotypes and Phenotypes: dbGaP</article-title>
          <source>Nucleic Acids Res</source>
          <year>2014</year>
          <volume>42</volume>
          <issue>Database issue</issue>
          <fpage>D975</fpage>
          <lpage>d979</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/24297256"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/nar/gkt1211</pub-id>
          <pub-id pub-id-type="medline">24297256</pub-id>
          <pub-id pub-id-type="pii">gkt1211</pub-id>
          <pub-id pub-id-type="pmcid">PMC3965052</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wiens</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Shenoy</surname>
              <given-names>ES</given-names>
            </name>
          </person-group>
          <article-title>Machine learning for healthcare: on the verge of a major shift in healthcare epidemiology</article-title>
          <source>Clin Infect Dis</source>
          <year>2018</year>
          <volume>66</volume>
          <issue>1</issue>
          <fpage>149</fpage>
          <lpage>153</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/29020316"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/cid/cix731</pub-id>
          <pub-id pub-id-type="medline">29020316</pub-id>
          <pub-id pub-id-type="pii">4085880</pub-id>
          <pub-id pub-id-type="pmcid">PMC5850539</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kosorok</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Laber</surname>
              <given-names>EB</given-names>
            </name>
          </person-group>
          <article-title>Precision medicine</article-title>
          <source>Annu Rev Stat Appl</source>
          <year>2019</year>
          <volume>6</volume>
          <issue>1</issue>
          <fpage>263</fpage>
          <lpage>286</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.annualreviews.org/doi/10.1146/annurev-statistics-030718-105251"/>
          </comment>
          <pub-id pub-id-type="doi">10.1146/annurev-statistics-030718-105251</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cho</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Shin</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Choy</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Do</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>How much data is needed to train a medical image deep learning system to achieve necessary high accuracy?</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on November 19, 2015</comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.1511.06348</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="web">
          <article-title>Incorporating nesterov momentum into adam</article-title>
          <source>International Conference of Learning Representations</source>
          <access-date>2024-01-16</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://openreview.net/pdf?id=OM0jvwB8jIp57ZJjtNEZ">https://openreview.net/pdf?id=OM0jvwB8jIp57ZJjtNEZ</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Smilkov</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Thorat</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Viégas</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Wattenberg</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>SmoothGrad: removing noise by adding noise</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on June 12, 2017</comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.1706.03825</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Akiba</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Sano</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Yanase</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ohta</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Koyama</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Optuna: A next-generation hyperparameter optimization framework</article-title>
          <year>2019</year>
          <conf-name>Proceedings of the 25th ACM SIGKDD International Conference on Knowledge Discovery Data Mining</conf-name>
          <conf-date>August 4-8, 2019</conf-date>
          <conf-loc>Anchorage, AK</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3292500.3330701</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shorten</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Khoshgoftaar</surname>
              <given-names>TM</given-names>
            </name>
          </person-group>
          <article-title>A survey on image data augmentation for deep learning</article-title>
          <source>J Big Data</source>
          <year>2019</year>
          <volume>6</volume>
          <issue>1</issue>
          <fpage>60</fpage>
          <pub-id pub-id-type="doi">10.1186/s40537-019-0197-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xiao</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Qin</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Transfer learning with convolutional neural networks for small sample size problem in machinery fault diagnosis</article-title>
          <source>Proceedings of the Institution of Mechanical Engineers, Part C: Journal of Mechanical Engineering Science</source>
          <year>2019</year>
          <volume>233</volume>
          <issue>14</issue>
          <fpage>5131</fpage>
          <lpage>5143</lpage>
          <pub-id pub-id-type="doi">10.1177/0954406219840381</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tsinganos</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Cornelis</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Cornelis</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jansen</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Skodras</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Data augmentation of surface electromyography for hand gesture recognition</article-title>
          <source>Sensors (Basel)</source>
          <year>2020</year>
          <volume>20</volume>
          <issue>17</issue>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=s20174892"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/s20174892</pub-id>
          <pub-id pub-id-type="medline">32872508</pub-id>
          <pub-id pub-id-type="pii">s20174892</pub-id>
          <pub-id pub-id-type="pmcid">PMC7506981</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stone</surname>
              <given-names>CJ</given-names>
            </name>
          </person-group>
          <article-title>Optimal rates of convergence for nonparametric estimators</article-title>
          <source>Ann Stat</source>
          <year>1980</year>
          <fpage>1348</fpage>
          <lpage>1360</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://sites.stat.washington.edu/courses/stat527/s14/readings/Stone_Annals_1980.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Varma</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Simon</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Bias in error estimation when using cross-validation for model selection</article-title>
          <source>BMC Bioinformatics</source>
          <year>2006</year>
          <volume>7</volume>
          <fpage>91</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcbioinformatics.biomedcentral.com/articles/10.1186/1471-2105-7-91"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1471-2105-7-91</pub-id>
          <pub-id pub-id-type="medline">16504092</pub-id>
          <pub-id pub-id-type="pii">1471-2105-7-91</pub-id>
          <pub-id pub-id-type="pmcid">PMC1397873</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Qi</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Random forest for bioinformatics</article-title>
          <source>Ensemble Mach Learn</source>
          <year>2012</year>
          <fpage>307</fpage>
          <lpage>323</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cs.cmu.edu/~qyj/papersA08/11-rfbook.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zeiler</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>ADADELTA: An adaptive learning rate method</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on December 22, 2012. <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://tinyurl.com/5623evb6">http://tinyurl.com/5623evb6</ext-link></comment>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bergstra</surname>
              <given-names>DY</given-names>
            </name>
            <collab>James</collab>
            <name name-style="western">
              <surname>Cox</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>HYPEROPT: A python library for optimizing the hyperparameters of machine learning algorithms</article-title>
          <year>2013</year>
          <conf-name>Proceedings of the 12th Python in Science Conference</conf-name>
          <conf-date>July 29-August 2, 2013</conf-date>
          <conf-loc>Austin, TX</conf-loc>
          <pub-id pub-id-type="doi">10.25080/Majora-8b375195-003</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kingma</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ba</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Adam: a method for stochastic optimization</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on December 22, 2014.  <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/pdf/1412.6980.pdf"/></comment>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bi</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Goodman</surname>
              <given-names>KE</given-names>
            </name>
            <name name-style="western">
              <surname>Kaminsky</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lessler</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>What is machine learning? A primer for the epidemiologist</article-title>
          <source>Am J Epidemiol</source>
          <year>2019</year>
          <volume>188</volume>
          <issue>12</issue>
          <fpage>2222</fpage>
          <lpage>2239</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://academic.oup.com/aje/article/188/12/2222/5567515?login=false"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/aje/kwz189</pub-id>
          <pub-id pub-id-type="medline">31509183</pub-id>
          <pub-id pub-id-type="pii">5567515</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Greener</surname>
              <given-names>JG</given-names>
            </name>
            <name name-style="western">
              <surname>Kandathil</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Moffat</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>DT</given-names>
            </name>
          </person-group>
          <article-title>A guide to machine learning for biologists</article-title>
          <source>Nat Rev Mol Cell Biol</source>
          <year>2022</year>
          <volume>23</volume>
          <issue>1</issue>
          <fpage>40</fpage>
          <lpage>55</lpage>
          <pub-id pub-id-type="doi">10.1038/s41580-021-00407-0</pub-id>
          <pub-id pub-id-type="medline">34518686</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41580-021-00407-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Asch</surname>
              <given-names>SM</given-names>
            </name>
          </person-group>
          <article-title>Machine learning and prediction in medicine—beyond the peak of inflated expectations</article-title>
          <source>N Engl J Med</source>
          <year>2017</year>
          <volume>376</volume>
          <issue>26</issue>
          <fpage>2507</fpage>
          <lpage>2509</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/28657867"/>
          </comment>
          <pub-id pub-id-type="doi">10.1056/NEJMp1702071</pub-id>
          <pub-id pub-id-type="medline">28657867</pub-id>
          <pub-id pub-id-type="pmcid">PMC5953825</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stiglic</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Viner</surname>
              <given-names>RM</given-names>
            </name>
          </person-group>
          <article-title>Effects of screentime on the health and well-being of children and adolescents: a systematic review of reviews</article-title>
          <source>BMJ Open</source>
          <year>2019</year>
          <volume>9</volume>
          <issue>1</issue>
          <fpage>e023191</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmjopen.bmj.com/lookup/pmidlookup?view=long&#38;pmid=30606703"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmjopen-2018-023191</pub-id>
          <pub-id pub-id-type="medline">30606703</pub-id>
          <pub-id pub-id-type="pii">bmjopen-2018-023191</pub-id>
          <pub-id pub-id-type="pmcid">PMC6326346</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fletcher</surname>
              <given-names>RR</given-names>
            </name>
            <name name-style="western">
              <surname>Chamberlain</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Richman</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Oreskovic</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Taveras</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Wearable sensor and algorithm for automated measurement of screen time</article-title>
          <year>2016</year>
          <conf-name>2016 IEEE Wireless Health (WH)</conf-name>
          <conf-date>October 25-27, 2016</conf-date>
          <conf-loc>Bethesda, MD</conf-loc>
          <fpage>1</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1109/WH.2016.7764564</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Debelee</surname>
              <given-names>TG</given-names>
            </name>
            <name name-style="western">
              <surname>Schwenker</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Ibenthal</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Yohannes</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Survey of deep learning in breast cancer image analysis</article-title>
          <source>Evol Syst</source>
          <year>2019</year>
          <volume>11</volume>
          <issue>1</issue>
          <fpage>143</fpage>
          <lpage>163</lpage>
          <pub-id pub-id-type="doi">10.1007/s12530-019-09297-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Explanation in artificial intelligence: insights from the social sciences</article-title>
          <source>Artif Intell</source>
          <year>2019</year>
          <volume>267</volume>
          <fpage>1</fpage>
          <lpage>38</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.sciencedirect.com/science/article/pii/S0004370218305988?via%3Dihub"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.artint.2018.07.007</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Doshi-Velez</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Towards a rigorous science of interpretable machine learning</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on February 28, 2017. <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1702.08608"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.1702.08608</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Levin</surname>
              <given-names>KA</given-names>
            </name>
          </person-group>
          <article-title>Study design v. case-control studies</article-title>
          <source>Evid Based Dent</source>
          <year>2006</year>
          <volume>7</volume>
          <issue>3</issue>
          <fpage>83</fpage>
          <lpage>84</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.nature.com/articles/6400436"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/sj.ebd.6400436</pub-id>
          <pub-id pub-id-type="medline">17003803</pub-id>
          <pub-id pub-id-type="pii">6400436</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rockhill</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Willett</surname>
              <given-names>WC</given-names>
            </name>
            <name name-style="western">
              <surname>Manson</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Leitzmann</surname>
              <given-names>MF</given-names>
            </name>
            <name name-style="western">
              <surname>Stampfer</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Hunter</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Colditz</surname>
              <given-names>GA</given-names>
            </name>
          </person-group>
          <article-title>Physical activity and mortality: a prospective study among women</article-title>
          <source>Am J Public Health</source>
          <year>2001</year>
          <volume>91</volume>
          <issue>4</issue>
          <fpage>578</fpage>
          <lpage>583</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ajph.aphapublications.org/doi/abs/10.2105/AJPH.91.4.578"/>
          </comment>
          <pub-id pub-id-type="doi">10.2105/ajph.91.4.578</pub-id>
          <pub-id pub-id-type="medline">11291369</pub-id>
          <pub-id pub-id-type="pmcid">PMC1446638</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cowie</surname>
              <given-names>CC</given-names>
            </name>
            <name name-style="western">
              <surname>Eberhardt</surname>
              <given-names>MS</given-names>
            </name>
          </person-group>
          <article-title>Sociodemographic characteristics of persons with diabetes</article-title>
          <source>Diabetes in America. 2nd Edition</source>
          <year>1995</year>
          <publisher-loc>Bethesda, MD</publisher-loc>
          <publisher-name>National Institute of Diabetes and Digestive and Kidney Diseases</publisher-name>
          <fpage>85</fpage>
          <lpage>116</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wager</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Athey</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Estimation and inference of heterogeneous treatment effects using random forests</article-title>
          <source>J Am Stat Assoc</source>
          <year>2018</year>
          <volume>113</volume>
          <issue>523</issue>
          <fpage>1228</fpage>
          <lpage>1242</lpage>
          <pub-id pub-id-type="doi">10.1080/01621459.2017.1319839</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Estimating the confidence interval for prediction errors of support vector machine classifiers</article-title>
          <source>J Mach Learn Res</source>
          <year>2008</year>
          <volume>9</volume>
          <fpage>521</fpage>
          <lpage>540</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmlr.org/papers/volume9/jiang08a/jiang08a.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Arbach</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Reinhardt</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bennett</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Fallouh</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Mammographic masses classification: comparison between Backpropagation Neural Network (BNN), K Nearest Neighbors (KNN), and human readers</article-title>
          <year>2003</year>
          <conf-name>CCECE 2003—Canadian Conference on Electrical and Computer Engineering. Toward a Caring and Humane Technology (Cat. No.03CH37436)</conf-name>
          <conf-date>May 4-7, 2003</conf-date>
          <conf-loc>Montreal, QC</conf-loc>
          <fpage>1441</fpage>
          <lpage>1444</lpage>
          <pub-id pub-id-type="doi">10.1109/ccece.2003.1226174</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hernan</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Robins</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>Causal inference</article-title>
          <source>GRASS (Grup de Recerca en Anàlisi eStadística de la Supervivència)</source>
          <year>2010</year>
          <access-date>2024-01-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://grass.upc.edu/en/seminar/presentation-files/causal-inference/chapters-1-i-2/@@download/file/BookHernanRobinsCap1_2.pdf">https://grass.upc.edu/en/seminar/presentation-files/causal-inference/chapters-1-i-2/@@download/file/BookHernanRobinsCap1_2.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Imbens</surname>
              <given-names>GW</given-names>
            </name>
            <name name-style="western">
              <surname>Rubin</surname>
              <given-names>DB</given-names>
            </name>
          </person-group>
          <source>Causal Inference for Statistics, Social, and Biomedical Sciences: An Introduction</source>
          <year>2015</year>
          <publisher-loc>New York, NY</publisher-loc>
          <publisher-name>Cambridge University Press</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Künzel</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Sekhon</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Bickel</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Metalearners for estimating heterogeneous treatment effects using machine learning</article-title>
          <source>Proc Natl Acad Sci U S A</source>
          <year>2019</year>
          <volume>116</volume>
          <issue>10</issue>
          <fpage>4156</fpage>
          <lpage>4165</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.pnas.org/doi/abs/10.1073/pnas.1804597116?url_ver=Z39.88-2003&#38;rfr_id=ori:rid:crossref.org&#38;rfr_dat=cr_pub  0pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1073/pnas.1804597116</pub-id>
          <pub-id pub-id-type="medline">30770453</pub-id>
          <pub-id pub-id-type="pii">1804597116</pub-id>
          <pub-id pub-id-type="pmcid">PMC6410831</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>BK</given-names>
            </name>
            <name name-style="western">
              <surname>Lessler</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Stuart</surname>
              <given-names>EA</given-names>
            </name>
          </person-group>
          <article-title>Improving propensity score weighting using machine learning</article-title>
          <source>Stat Med</source>
          <year>2010</year>
          <volume>29</volume>
          <issue>3</issue>
          <fpage>337</fpage>
          <lpage>346</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/19960510"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/sim.3782</pub-id>
          <pub-id pub-id-type="medline">19960510</pub-id>
          <pub-id pub-id-type="pmcid">PMC2807890</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Su</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Ge</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Fan</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Propensity score and proximity matching using random forest</article-title>
          <source>Contemp Clin Trials</source>
          <year>2016</year>
          <volume>47</volume>
          <fpage>85</fpage>
          <lpage>92</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/26706666"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.cct.2015.12.012</pub-id>
          <pub-id pub-id-type="medline">26706666</pub-id>
          <pub-id pub-id-type="pii">S1551-7144(15)30143-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC4818178</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Ngom</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Data integration in machine learning</article-title>
          <year>2015</year>
          <conf-name>2015 IEEE International Conference on Bioinformatics and Biomedicine (BIBM)</conf-name>
          <conf-date>November 9-12, 2015</conf-date>
          <conf-loc>Washington, DC</conf-loc>
          <fpage>1665</fpage>
          <lpage>1671</lpage>
          <pub-id pub-id-type="doi">10.1109/bibm.2015.7359925</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>FX</given-names>
            </name>
            <name name-style="western">
              <surname>Ngom</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>A review on machine learning principles for multi-view biological data integration</article-title>
          <source>Brief Bioinform</source>
          <year>2018</year>
          <volume>19</volume>
          <issue>2</issue>
          <fpage>325</fpage>
          <lpage>340</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://academic.oup.com/bib/article/19/2/325/2664338?login=false"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/bib/bbw113</pub-id>
          <pub-id pub-id-type="medline">28011753</pub-id>
          <pub-id pub-id-type="pii">2664338</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhong</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>How to calculate sample size in randomized controlled trial?</article-title>
          <source>J Thorac Dis</source>
          <year>2009</year>
          <volume>1</volume>
          <issue>1</issue>
          <fpage>51</fpage>
          <lpage>54</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/22263004"/>
          </comment>
          <pub-id pub-id-type="medline">22263004</pub-id>
          <pub-id pub-id-type="pmcid">PMC3256489</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Carley</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Harrison</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>An introduction to power and sample size estimation</article-title>
          <source>Emerg Med J</source>
          <year>2003</year>
          <volume>20</volume>
          <issue>5</issue>
          <fpage>453</fpage>
          <lpage>458</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://emj.bmj.com/lookup/pmidlookup?view=long&#38;pmid=12954688"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/emj.20.5.453</pub-id>
          <pub-id pub-id-type="medline">12954688</pub-id>
          <pub-id pub-id-type="pmcid">PMC1726174</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vapnik</surname>
              <given-names>VN</given-names>
            </name>
          </person-group>
          <source>The Nature of Statistical Learning Theory</source>
          <year>1999</year>
          <publisher-loc>New York, NY</publisher-loc>
          <publisher-name>Springer</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Perlich</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Provost</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Simonoff</surname>
              <given-names>JS</given-names>
            </name>
          </person-group>
          <article-title>Tree induction vs. logistic regression: a learning-curve analysis</article-title>
          <source>J Mach Learn Res</source>
          <year>2003</year>
          <volume>4</volume>
          <fpage>211</fpage>
          <lpage>255</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmlr.org/papers/volume4/perlich03a/perlich03a.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Beleites</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Neugebauer</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Bocklitz</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Krafft</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Popp</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Sample size planning for classification models</article-title>
          <source>Anal Chim Acta</source>
          <year>2013</year>
          <volume>760</volume>
          <fpage>25</fpage>
          <lpage>33</lpage>
          <pub-id pub-id-type="doi">10.1016/j.aca.2012.11.007</pub-id>
          <pub-id pub-id-type="medline">23265730</pub-id>
          <pub-id pub-id-type="pii">S0003-2670(12)01647-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kandel</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Heer</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Plaisant</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Kennedy</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>van Ham</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Riche</surname>
              <given-names>NH</given-names>
            </name>
            <name name-style="western">
              <surname>Weaver</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Brodbeck</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Buono</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Research directions in data wrangling: visualizations and transformations for usable and credible data</article-title>
          <source>Inf Vis</source>
          <year>2011</year>
          <volume>10</volume>
          <issue>4</issue>
          <fpage>271</fpage>
          <lpage>288</lpage>
          <pub-id pub-id-type="doi">10.1177/1473871611415994</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jerez</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Molina</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>García-Laencina</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Alba</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Ribelles</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Martín</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Franco</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Missing data imputation using statistical and machine learning methods in a real breast cancer problem</article-title>
          <source>Artif Intell Med</source>
          <year>2010</year>
          <volume>50</volume>
          <issue>2</issue>
          <fpage>105</fpage>
          <lpage>115</lpage>
          <pub-id pub-id-type="doi">10.1016/j.artmed.2010.05.002</pub-id>
          <pub-id pub-id-type="medline">20638252</pub-id>
          <pub-id pub-id-type="pii">S0933-3657(10)00067-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pierson</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Yau</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>ZIFA: dimensionality reduction for zero-inflated single-cell gene expression analysis</article-title>
          <source>Genome Biol</source>
          <year>2015</year>
          <volume>16</volume>
          <fpage>241</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://genomebiology.biomedcentral.com/articles/10.1186/s13059-015-0805-z"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s13059-015-0805-z</pub-id>
          <pub-id pub-id-type="medline">26527291</pub-id>
          <pub-id pub-id-type="pii">10.1186/s13059-015-0805-z</pub-id>
          <pub-id pub-id-type="pmcid">PMC4630968</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>CY</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>YC</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>YH</given-names>
            </name>
          </person-group>
          <article-title>The optimal machine learning-based missing data imputation for the cox proportional hazard model</article-title>
          <source>Front Public Health</source>
          <year>2021</year>
          <volume>9</volume>
          <fpage>680054</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34291028"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fpubh.2021.680054</pub-id>
          <pub-id pub-id-type="medline">34291028</pub-id>
          <pub-id pub-id-type="pmcid">PMC8289437</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stekhoven</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Bühlmann</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>MissForest--non-parametric missing value imputation for mixed-type data</article-title>
          <source>Bioinformatics</source>
          <year>2012</year>
          <volume>28</volume>
          <issue>1</issue>
          <fpage>112</fpage>
          <lpage>118</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://academic.oup.com/bioinformatics/article/28/1/112/219101?login=false"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/btr597</pub-id>
          <pub-id pub-id-type="medline">22039212</pub-id>
          <pub-id pub-id-type="pii">btr597</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gilpin</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Bau</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Yuan</surname>
              <given-names>BZ</given-names>
            </name>
            <name name-style="western">
              <surname>Bajwa</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Specter</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kagal</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Explaining explanations: an overview of interpretability of machine learning</article-title>
          <year>2018</year>
          <conf-name>2018 IEEE 5th International Conference on Data Science and Advanced Analytics (DSAA)</conf-name>
          <conf-date>October 01-03, 2018</conf-date>
          <conf-loc>Turin, Italy</conf-loc>
          <fpage>80</fpage>
          <lpage>89</lpage>
          <pub-id pub-id-type="doi">10.1109/dsaa.2018.00018</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Deng</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Du</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Rui</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Deng</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Boey</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Armstrong</surname>
              <given-names>DG</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Deng</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>An explainable machine learning model for predicting in-hospital amputation rate of patients with diabetic foot ulcer</article-title>
          <source>Int Wound J</source>
          <year>2022</year>
          <volume>19</volume>
          <issue>4</issue>
          <fpage>910</fpage>
          <lpage>918</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34520110"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/iwj.13691</pub-id>
          <pub-id pub-id-type="medline">34520110</pub-id>
          <pub-id pub-id-type="pmcid">PMC9013600</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Raschka</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Model evaluation, model selection, and algorithm selection in machine learning</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on November 13, 2018. <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1811.12808"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Saeb</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lonini</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Jayaraman</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mohr</surname>
              <given-names>DC</given-names>
            </name>
            <name name-style="western">
              <surname>Kording</surname>
              <given-names>KP</given-names>
            </name>
          </person-group>
          <article-title>The need to approximate the use-case in clinical machine learning</article-title>
          <source>Gigascience</source>
          <year>2017</year>
          <volume>6</volume>
          <issue>5</issue>
          <fpage>1</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/28327985"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/gigascience/gix019</pub-id>
          <pub-id pub-id-type="medline">28327985</pub-id>
          <pub-id pub-id-type="pii">3071704</pub-id>
          <pub-id pub-id-type="pmcid">PMC5441397</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Phung</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Tran</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Gupta</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Rana</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Karmakar</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Shilton</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Yearwood</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dimitrova</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Ho</surname>
              <given-names>TB</given-names>
            </name>
            <name name-style="western">
              <surname>Venkatesh</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Berk</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Guidelines for developing and reporting machine learning predictive models in biomedical research: a multidisciplinary view</article-title>
          <source>J Med Internet Res</source>
          <year>2016</year>
          <volume>18</volume>
          <issue>12</issue>
          <fpage>e323</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2016/12/e323/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.5870</pub-id>
          <pub-id pub-id-type="medline">27986644</pub-id>
          <pub-id pub-id-type="pii">v18i12e323</pub-id>
          <pub-id pub-id-type="pmcid">PMC5238707</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Peat</surname>
              <given-names>JK</given-names>
            </name>
            <name name-style="western">
              <surname>Mellis</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Xuan</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <source>Health Science Research: A Handbook of Quantitative Methods</source>
          <year>2020</year>
          <publisher-loc>London, UK</publisher-loc>
          <publisher-name>Routledge</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Woodward</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <source>Epidemiology: Study Design and Data Analysis, 3rd Edition</source>
          <year>2013</year>
          <publisher-loc>Boca Raton, FL</publisher-loc>
          <publisher-name>CRC press</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pallmann</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Bedding</surname>
              <given-names>AW</given-names>
            </name>
            <name name-style="western">
              <surname>Choodari-Oskooei</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Dimairo</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Flight</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Hampson</surname>
              <given-names>LV</given-names>
            </name>
            <name name-style="western">
              <surname>Holmes</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Mander</surname>
              <given-names>AP</given-names>
            </name>
            <name name-style="western">
              <surname>Odondi</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Sydes</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Villar</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Wason</surname>
              <given-names>JMS</given-names>
            </name>
            <name name-style="western">
              <surname>Weir</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Wheeler</surname>
              <given-names>GM</given-names>
            </name>
            <name name-style="western">
              <surname>Yap</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Jaki</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Adaptive designs in clinical trials: why use them, and how to run and report them</article-title>
          <source>BMC Med</source>
          <year>2018</year>
          <volume>16</volume>
          <issue>1</issue>
          <fpage>29</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedicine.biomedcentral.com/articles/10.1186/s12916-018-1017-7"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12916-018-1017-7</pub-id>
          <pub-id pub-id-type="medline">29490655</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12916-018-1017-7</pub-id>
          <pub-id pub-id-type="pmcid">PMC5830330</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref61">
        <label>61</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Shami</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>On hyperparameter optimization of machine learning algorithms: theory and practice</article-title>
          <source>Neurocomputing</source>
          <year>2020</year>
          <volume>415</volume>
          <fpage>295</fpage>
          <lpage>316</lpage>
          <pub-id pub-id-type="doi">10.1016/j.neucom.2020.07.061</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref62">
        <label>62</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Devlin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>MW</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Toutanova</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>BERT: pre-training of deep bidirectional transformers for language understanding</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on October 11, 2018. <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1810.04805"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref63">
        <label>63</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vaswani</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Shazeer</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Parmar</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Uszkoreit</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Gomez</surname>
              <given-names>AN</given-names>
            </name>
            <name name-style="western">
              <surname>Kaiser</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Polosukhin</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Guyon</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Von Luxburg</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Bengio</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wallach</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Fergus</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Vishwanathan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Garnett</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Attention is all you need</article-title>
          <source>Advances in Neural Information Processing Systems 30 (NIPS 2017)</source>
          <year>2017</year>
          <publisher-loc>New York, NY</publisher-loc>
          <publisher-name>Curran Associates</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref64">
        <label>64</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Radford</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Narasimhan</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Salimans</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Sutskever</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Improving language understanding by generative pre-training</article-title>
          <source>Papers With Code</source>
          <year>2018</year>
          <access-date>2024-01-19</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://paperswithcode.com/paper/improving-language-understanding-by">https://paperswithcode.com/paper/improving-language-understanding-by</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref65">
        <label>65</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rasmy</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Xiang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Tao</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zhi</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Med-BERT: pretrained contextualized embeddings on large-scale structured electronic health records for disease prediction</article-title>
          <source>NPJ Digit Med</source>
          <year>2021</year>
          <volume>4</volume>
          <issue>1</issue>
          <fpage>86</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41746-021-00455-y"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41746-021-00455-y</pub-id>
          <pub-id pub-id-type="medline">34017034</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41746-021-00455-y</pub-id>
          <pub-id pub-id-type="pmcid">PMC8137882</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref66">
        <label>66</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Beltagy</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Lo</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Cohan</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>SciBERT: a pretrained language model for scientific text</article-title>
          <year>2019</year>
          <conf-name>Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing and the 9th International Joint Conference on Natural Language Processing (EMNLP-IJCNLP)</conf-name>
          <conf-date>November 3–7, 2019</conf-date>
          <conf-loc>Hong Kong, China</conf-loc>
          <publisher-name>Association for Computational Linguistics</publisher-name>
          <fpage>3615</fpage>
          <lpage>3620</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://aclanthology.org/D19-1371.pdf"/>
          </comment>
          <pub-id pub-id-type="doi">10.18653/v1/d19-1371</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref67">
        <label>67</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Krizhevsky</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sutskever</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Hinton</surname>
              <given-names>GE</given-names>
            </name>
          </person-group>
          <article-title>ImageNet classification with deep convolutional neural networks</article-title>
          <source>Commun ACM</source>
          <year>2017</year>
          <volume>6</volume>
          <issue>6</issue>
          <fpage>84</fpage>
          <lpage>90</lpage>
          <pub-id pub-id-type="doi">10.1145/3065386</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref68">
        <label>68</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Deng</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dong</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Socher</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>LJ</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Fei-Fei</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>ImageNet: a large-scale hierarchical image database</article-title>
          <year>2009</year>
          <conf-name>2009 IEEE Conference on Computer Vision and Pattern Recognition</conf-name>
          <conf-date>June 20-25, 2009</conf-date>
          <conf-loc>Miami, FL</conf-loc>
          <fpage>248</fpage>
          <lpage>255</lpage>
          <pub-id pub-id-type="doi">10.1109/cvpr.2009.5206848</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref69">
        <label>69</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Anwar</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Majid</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Qayyum</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Awais</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Alnowami</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Khan</surname>
              <given-names>MK</given-names>
            </name>
          </person-group>
          <article-title>Medical image analysis using convolutional neural networks: a review</article-title>
          <source>J Med Syst</source>
          <year>2018</year>
          <volume>42</volume>
          <issue>11</issue>
          <fpage>226</fpage>
          <pub-id pub-id-type="doi">10.1007/s10916-018-1088-1</pub-id>
          <pub-id pub-id-type="medline">30298337</pub-id>
          <pub-id pub-id-type="pii">10.1007/s10916-018-1088-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref70">
        <label>70</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Weiss</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Khoshgoftaar</surname>
              <given-names>TM</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>A survey of transfer learning</article-title>
          <source>J Big Data</source>
          <year>2016</year>
          <volume>3</volume>
          <fpage>9</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://journalofbigdata.springeropen.com/articles/10.1186/s40537-016-0043-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s40537-016-0043-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref71">
        <label>71</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Libbrecht</surname>
              <given-names>MW</given-names>
            </name>
            <name name-style="western">
              <surname>Noble</surname>
              <given-names>WS</given-names>
            </name>
          </person-group>
          <article-title>Machine learning applications in genetics and genomics</article-title>
          <source>Nat Rev Genet</source>
          <year>2015</year>
          <volume>16</volume>
          <issue>6</issue>
          <fpage>321</fpage>
          <lpage>332</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/25948244"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/nrg3920</pub-id>
          <pub-id pub-id-type="medline">25948244</pub-id>
          <pub-id pub-id-type="pii">nrg3920</pub-id>
          <pub-id pub-id-type="pmcid">PMC5204302</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref72">
        <label>72</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nicholls</surname>
              <given-names>HL</given-names>
            </name>
            <name name-style="western">
              <surname>John</surname>
              <given-names>CR</given-names>
            </name>
            <name name-style="western">
              <surname>Watson</surname>
              <given-names>DS</given-names>
            </name>
            <name name-style="western">
              <surname>Munroe</surname>
              <given-names>PB</given-names>
            </name>
            <name name-style="western">
              <surname>Barnes</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Cabrera</surname>
              <given-names>CP</given-names>
            </name>
          </person-group>
          <article-title>Reaching the end-game for GWAS: machine learning approaches for the prioritization of complex disease loci</article-title>
          <source>Front Genet</source>
          <year>2020</year>
          <volume>11</volume>
          <fpage>350</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32351543"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fgene.2020.00350</pub-id>
          <pub-id pub-id-type="medline">32351543</pub-id>
          <pub-id pub-id-type="pmcid">PMC7174742</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref73">
        <label>73</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zou</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Huss</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Abid</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mohammadi</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Torkamani</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Telenti</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>A primer on deep learning in genomics</article-title>
          <source>Nat Genet</source>
          <year>2019</year>
          <volume>51</volume>
          <issue>1</issue>
          <fpage>12</fpage>
          <lpage>18</lpage>
          <pub-id pub-id-type="doi">10.1038/s41588-018-0295-5</pub-id>
          <pub-id pub-id-type="medline">30478442</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41588-018-0295-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref74">
        <label>74</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Eraslan</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Avsec</surname>
              <given-names>Ž</given-names>
            </name>
            <name name-style="western">
              <surname>Gagneur</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Theis</surname>
              <given-names>FJ</given-names>
            </name>
          </person-group>
          <article-title>Deep learning: new computational modelling techniques for genomics</article-title>
          <source>Nat Rev Genet</source>
          <year>2019</year>
          <volume>20</volume>
          <issue>7</issue>
          <fpage>389</fpage>
          <lpage>403</lpage>
          <pub-id pub-id-type="doi">10.1038/s41576-019-0122-6</pub-id>
          <pub-id pub-id-type="medline">30971806</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41576-019-0122-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref75">
        <label>75</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ung</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Greene</surname>
              <given-names>CS</given-names>
            </name>
          </person-group>
          <article-title>Unsupervised feature construction and knowledge extraction from genome-wide assays of breast cancer with denoising autoencoders</article-title>
          <source>Pac Symp Biocomput</source>
          <year>2015</year>
          <volume>20</volume>
          <fpage>132</fpage>
          <lpage>143</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://psb.stanford.edu/psb-online/proceedings/psb15/abstracts/2015_p132.html"/>
          </comment>
          <pub-id pub-id-type="medline">25592575</pub-id>
          <pub-id pub-id-type="pii">9789814644730_0014</pub-id>
          <pub-id pub-id-type="pmcid">PMC4299935</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref76">
        <label>76</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Van der Maaten</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Hinton</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Visualizing data using t-SNE</article-title>
          <source>J Mach Learn Res</source>
          <year>2008</year>
          <volume>9</volume>
          <fpage>2579</fpage>
          <lpage>2605</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmlr.org/papers/volume9/vandermaaten08a/vandermaaten08a.pdf?fbcl"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref77">
        <label>77</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Meng</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zeleznik</surname>
              <given-names>OA</given-names>
            </name>
            <name name-style="western">
              <surname>Thallinger</surname>
              <given-names>GG</given-names>
            </name>
            <name name-style="western">
              <surname>Kuster</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Gholami</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Culhane</surname>
              <given-names>AC</given-names>
            </name>
          </person-group>
          <article-title>Dimension reduction techniques for the integrative analysis of multi-omics data</article-title>
          <source>Brief Bioinform</source>
          <year>2016</year>
          <volume>17</volume>
          <issue>4</issue>
          <fpage>628</fpage>
          <lpage>641</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/26969681"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/bib/bbv108</pub-id>
          <pub-id pub-id-type="medline">26969681</pub-id>
          <pub-id pub-id-type="pii">bbv108</pub-id>
          <pub-id pub-id-type="pmcid">PMC4945831</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref78">
        <label>78</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Grutters</surname>
              <given-names>JPC</given-names>
            </name>
            <name name-style="western">
              <surname>Sculpher</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Briggs</surname>
              <given-names>AH</given-names>
            </name>
            <name name-style="western">
              <surname>Severens</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Candel</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Stahl</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>De Ruysscher</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Boer</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ramaekers</surname>
              <given-names>BLT</given-names>
            </name>
            <name name-style="western">
              <surname>Joore</surname>
              <given-names>MA</given-names>
            </name>
          </person-group>
          <article-title>Acknowledging patient heterogeneity in economic evaluation: a systematic literature review</article-title>
          <source>Pharmacoeconomics</source>
          <year>2013</year>
          <volume>31</volume>
          <issue>2</issue>
          <fpage>111</fpage>
          <lpage>123</lpage>
          <pub-id pub-id-type="doi">10.1007/s40273-012-0015-4</pub-id>
          <pub-id pub-id-type="medline">23329430</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref79">
        <label>79</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Rush</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Kosorok</surname>
              <given-names>MR</given-names>
            </name>
          </person-group>
          <article-title>Estimating individualized treatment rules using outcome weighted learning</article-title>
          <source>J Am Stat Assoc</source>
          <year>2012</year>
          <volume>107</volume>
          <issue>449</issue>
          <fpage>1106</fpage>
          <lpage>1118</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/23630406"/>
          </comment>
          <pub-id pub-id-type="doi">10.1080/01621459.2012.695674</pub-id>
          <pub-id pub-id-type="medline">23630406</pub-id>
          <pub-id pub-id-type="pmcid">PMC3636816</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref80">
        <label>80</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Tsiatis</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Laber</surname>
              <given-names>EB</given-names>
            </name>
            <name name-style="western">
              <surname>Davidian</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>A robust method for estimating optimal treatment regimes</article-title>
          <source>Biometrics</source>
          <year>2012</year>
          <volume>68</volume>
          <issue>4</issue>
          <fpage>1010</fpage>
          <lpage>1018</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/22550953"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/j.1541-0420.2012.01763.x</pub-id>
          <pub-id pub-id-type="medline">22550953</pub-id>
          <pub-id pub-id-type="pmcid">PMC3556998</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref81">
        <label>81</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Laber</surname>
              <given-names>EB</given-names>
            </name>
            <name name-style="western">
              <surname>Tsiatis</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Davidian</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Using decision lists to construct interpretable and parsimonious treatment regimes</article-title>
          <source>Biometrics</source>
          <year>2015</year>
          <volume>71</volume>
          <issue>4</issue>
          <fpage>895</fpage>
          <lpage>904</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/26193819"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/biom.12354</pub-id>
          <pub-id pub-id-type="medline">26193819</pub-id>
          <pub-id pub-id-type="pmcid">PMC4715597</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref82">
        <label>82</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Athey</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wager</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Efficient policy learning</article-title>
          <source>Stanford Institute for Economic Policy Research (SIEPR)</source>
          <year>2017</year>
          <access-date>2024-01-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://siepr.stanford.edu/publications/working-paper/efficient-policy-learning">https://siepr.stanford.edu/publications/working-paper/efficient-policy-learning</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref83">
        <label>83</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Almirall</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Nahum-Shani</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Sherwood</surname>
              <given-names>NE</given-names>
            </name>
            <name name-style="western">
              <surname>Murphy</surname>
              <given-names>SA</given-names>
            </name>
          </person-group>
          <article-title>Introduction to SMART designs for the development of adaptive interventions: with application to weight loss research</article-title>
          <source>Transl Behav Med</source>
          <year>2014</year>
          <volume>4</volume>
          <issue>3</issue>
          <fpage>260</fpage>
          <lpage>274</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/25264466"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s13142-014-0265-0</pub-id>
          <pub-id pub-id-type="medline">25264466</pub-id>
          <pub-id pub-id-type="pii">265</pub-id>
          <pub-id pub-id-type="pmcid">PMC4167891</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref84">
        <label>84</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kosorok</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Moodie</surname>
              <given-names>EE</given-names>
            </name>
          </person-group>
          <source>Adaptive Treatment Strategies in Practice: Planning Trials and Analyzing Data for Personalized Medicine</source>
          <year>2015</year>
          <publisher-loc>Philadelphia, PA</publisher-loc>
          <publisher-name>Society for Industrial and Applied Mathematics</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref85">
        <label>85</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chakraborty</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Murphy</surname>
              <given-names>SA</given-names>
            </name>
          </person-group>
          <article-title>Dynamic treatment regimes</article-title>
          <source>Annu Rev Stat Appl</source>
          <year>2014</year>
          <volume>1</volume>
          <fpage>447</fpage>
          <lpage>464</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/25401119"/>
          </comment>
          <pub-id pub-id-type="doi">10.1146/annurev-statistics-022513-115553</pub-id>
          <pub-id pub-id-type="medline">25401119</pub-id>
          <pub-id pub-id-type="pmcid">PMC4231831</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref86">
        <label>86</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>YQ</given-names>
            </name>
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Laber</surname>
              <given-names>EB</given-names>
            </name>
            <name name-style="western">
              <surname>Kosorok</surname>
              <given-names>MR</given-names>
            </name>
          </person-group>
          <article-title>New statistical learning methods for estimating optimal dynamic treatment regimes</article-title>
          <source>J Am Stat Assoc</source>
          <year>2015</year>
          <volume>110</volume>
          <issue>510</issue>
          <fpage>583</fpage>
          <lpage>598</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/26236062"/>
          </comment>
          <pub-id pub-id-type="doi">10.1080/01621459.2014.937488</pub-id>
          <pub-id pub-id-type="medline">26236062</pub-id>
          <pub-id pub-id-type="pmcid">PMC4517946</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref87">
        <label>87</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Tsiatis</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Laber</surname>
              <given-names>EB</given-names>
            </name>
            <name name-style="western">
              <surname>Davidian</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Robust estimation of optimal dynamic treatment regimes for sequential treatment decisions</article-title>
          <source>Biometrika</source>
          <year>2013</year>
          <volume>100</volume>
          <issue>3</issue>
          <fpage>681</fpage>
          <lpage>684</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/24302771"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/biomet/ast014</pub-id>
          <pub-id pub-id-type="medline">24302771</pub-id>
          <pub-id pub-id-type="pmcid">PMC3843953</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref88">
        <label>88</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Laber</surname>
              <given-names>EB</given-names>
            </name>
            <name name-style="western">
              <surname>Davidian</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tsiatis</surname>
              <given-names>AA</given-names>
            </name>
          </person-group>
          <article-title>Interpretable dynamic treatment regimes</article-title>
          <source>J Am Stat Assoc</source>
          <year>2018</year>
          <volume>113</volume>
          <issue>524</issue>
          <fpage>1541</fpage>
          <lpage>1549</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/30774169"/>
          </comment>
          <pub-id pub-id-type="doi">10.1080/01621459.2017.1345743</pub-id>
          <pub-id pub-id-type="medline">30774169</pub-id>
          <pub-id pub-id-type="pmcid">PMC6373443</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref89">
        <label>89</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Song</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Lou</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Shi</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Salvage treatment with apatinib for advanced non-small-cell lung cancer</article-title>
          <source>Onco Targets Ther</source>
          <year>2017</year>
          <volume>10</volume>
          <fpage>1821</fpage>
          <lpage>1825</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/28367065"/>
          </comment>
          <pub-id pub-id-type="doi">10.2147/OTT.S113435</pub-id>
          <pub-id pub-id-type="medline">28367065</pub-id>
          <pub-id pub-id-type="pii">ott-10-1821</pub-id>
          <pub-id pub-id-type="pmcid">PMC5370069</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref90">
        <label>90</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lei</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Nahum-Shani</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Lynch</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Oslin</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Murphy</surname>
              <given-names>SA</given-names>
            </name>
          </person-group>
          <article-title>A "SMART" design for building individualized treatment sequences</article-title>
          <source>Annu Rev Clin Psychol</source>
          <year>2012</year>
          <volume>8</volume>
          <fpage>21</fpage>
          <lpage>48</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/22224838"/>
          </comment>
          <pub-id pub-id-type="doi">10.1146/annurev-clinpsy-032511-143152</pub-id>
          <pub-id pub-id-type="medline">22224838</pub-id>
          <pub-id pub-id-type="pmcid">PMC3887122</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref91">
        <label>91</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tejedor</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Woldaregay</surname>
              <given-names>AZ</given-names>
            </name>
            <name name-style="western">
              <surname>Godtliebsen</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Reinforcement learning application in diabetes blood glucose control: a systematic review</article-title>
          <source>Artif Intell Med</source>
          <year>2020</year>
          <volume>104</volume>
          <fpage>101836</fpage>
          <pub-id pub-id-type="doi">10.1016/j.artmed.2020.101836</pub-id>
          <pub-id pub-id-type="medline">32499004</pub-id>
          <pub-id pub-id-type="pii">S0933-3657(18)30454-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref92">
        <label>92</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nahum-Shani</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>SN</given-names>
            </name>
            <name name-style="western">
              <surname>Spring</surname>
              <given-names>BJ</given-names>
            </name>
            <name name-style="western">
              <surname>Collins</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Witkiewitz</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Tewari</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Murphy</surname>
              <given-names>SA</given-names>
            </name>
          </person-group>
          <article-title>Just-in-Time Adaptive Interventions (JITAIs) in mobile health: key components and design principles for ongoing health behavior support</article-title>
          <source>Ann Behav Med</source>
          <year>2018</year>
          <volume>52</volume>
          <issue>6</issue>
          <fpage>446</fpage>
          <lpage>462</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/27663578"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s12160-016-9830-8</pub-id>
          <pub-id pub-id-type="medline">27663578</pub-id>
          <pub-id pub-id-type="pii">10.1007/s12160-016-9830-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC5364076</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref93">
        <label>93</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Luckett</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Laber</surname>
              <given-names>EB</given-names>
            </name>
            <name name-style="western">
              <surname>Kahkoska</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>Maahs</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Mayer-Davis</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Kosorok</surname>
              <given-names>MR</given-names>
            </name>
          </person-group>
          <article-title>Estimating dynamic treatment regimes in mobile health using V-learning</article-title>
          <source>J Am Stat Assoc</source>
          <year>2020</year>
          <volume>115</volume>
          <issue>530</issue>
          <fpage>692</fpage>
          <lpage>706</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32952236"/>
          </comment>
          <pub-id pub-id-type="doi">10.1080/01621459.2018.1537919</pub-id>
          <pub-id pub-id-type="medline">32952236</pub-id>
          <pub-id pub-id-type="pmcid">PMC7500510</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref94">
        <label>94</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Friedman</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Letai</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Fisher</surname>
              <given-names>DE</given-names>
            </name>
            <name name-style="western">
              <surname>Flaherty</surname>
              <given-names>KT</given-names>
            </name>
          </person-group>
          <article-title>Precision medicine for cancer with next-generation functional diagnostics</article-title>
          <source>Nat Rev Cancer</source>
          <year>2015</year>
          <volume>15</volume>
          <issue>12</issue>
          <fpage>747</fpage>
          <lpage>756</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/26536825"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/nrc4015</pub-id>
          <pub-id pub-id-type="medline">26536825</pub-id>
          <pub-id pub-id-type="pii">nrc4015</pub-id>
          <pub-id pub-id-type="pmcid">PMC4970460</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref95">
        <label>95</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zou</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Schiebinger</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>AI can be sexist and racist—it's time to make it fair</article-title>
          <source>Nature</source>
          <year>2018</year>
          <volume>559</volume>
          <issue>7714</issue>
          <fpage>324</fpage>
          <lpage>326</lpage>
          <pub-id pub-id-type="doi">10.1038/d41586-018-05707-8</pub-id>
          <pub-id pub-id-type="medline">30018439</pub-id>
          <pub-id pub-id-type="pii">10.1038/d41586-018-05707-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref96">
        <label>96</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mehrabi</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Morstatter</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Saxena</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Lerman</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Galstyan</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>A survey on bias and fairness in machine learning</article-title>
          <source>ACM Comput Surv</source>
          <year>2021</year>
          <volume>54</volume>
          <issue>6</issue>
          <fpage>1</fpage>
          <lpage>35</lpage>
          <pub-id pub-id-type="doi">10.1145/3457607</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref97">
        <label>97</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Corbett-Davies</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Gaebler</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Nilforoshan</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Shroff</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Goel</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>The measure and mismeasure of fairness: a critical review of fair machine learning</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on July 31, 2018. <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1808.00023"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.1808.00023</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref98">
        <label>98</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Larrazabal</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Nieto</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Peterson</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Milone</surname>
              <given-names>DH</given-names>
            </name>
            <name name-style="western">
              <surname>Ferrante</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Gender imbalance in medical imaging datasets produces biased classifiers for computer-aided diagnosis</article-title>
          <source>Proc Natl Acad Sci U S A</source>
          <year>2020</year>
          <volume>117</volume>
          <issue>23</issue>
          <fpage>12592</fpage>
          <lpage>12594</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.pnas.org/doi/abs/10.1073/pnas.1919012117?url_ver=Z39.88-2003&#38;rfr_id=ori:rid:crossref.org&#38;rfr_dat=cr_pub  0pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1073/pnas.1919012117</pub-id>
          <pub-id pub-id-type="medline">32457147</pub-id>
          <pub-id pub-id-type="pii">1919012117</pub-id>
          <pub-id pub-id-type="pmcid">PMC7293650</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref99">
        <label>99</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wolf</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Debut</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Sanh</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Chaumond</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Delangue</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Moi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cistac</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Rault</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Louf</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Funtowicz</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Davison</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Shleifer</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>von Platen</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Jernite</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Plu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Scao</surname>
              <given-names>TL</given-names>
            </name>
            <name name-style="western">
              <surname>Gugger</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Drame</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lhoest</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Rush</surname>
              <given-names>AM</given-names>
            </name>
          </person-group>
          <article-title>Transformers: state-of-the-art natural language processing</article-title>
          <year>2020</year>
          <conf-name>Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing: System Demonstrations</conf-name>
          <conf-date>November 16-20, 2020</conf-date>
          <conf-loc>Virtual</conf-loc>
          <publisher-name>Association for Computational Linguistics</publisher-name>
          <fpage>38</fpage>
          <lpage>45</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://aclanthology.org/2020.emnlp-demos.6/"/>
          </comment>
          <pub-id pub-id-type="doi">10.18653/v1/2020.emnlp-demos.6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref100">
        <label>100</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhuang</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Qi</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Duan</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Xi</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Xiong</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>Q</given-names>
            </name>
          </person-group>
          <article-title>A comprehensive survey on transfer learning</article-title>
          <source>Proc IEEE</source>
          <year>2021</year>
          <volume>109</volume>
          <issue>1</issue>
          <fpage>43</fpage>
          <lpage>76</lpage>
          <pub-id pub-id-type="doi">10.1109/jproc.2020.3004555</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref101">
        <label>101</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kaelbling</surname>
              <given-names>LP</given-names>
            </name>
            <name name-style="western">
              <surname>Littman</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Moore</surname>
              <given-names>AW</given-names>
            </name>
          </person-group>
          <article-title>Reinforcement learning: a survey</article-title>
          <source>J Artif Intell Res</source>
          <year>1996</year>
          <volume>4</volume>
          <fpage>237</fpage>
          <lpage>285</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jair.org/index.php/jair/article/view/10166"/>
          </comment>
          <pub-id pub-id-type="doi">10.1613/jair.301</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref102">
        <label>102</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Nemati</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Yin</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Reinforcement learning in healthcare: a survey</article-title>
          <source>ACM Comput Surv</source>
          <year>2021</year>
          <volume>55</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>36</lpage>
          <pub-id pub-id-type="doi">10.1145/3477600</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref103">
        <label>103</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gottesman</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Johansson</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Komorowski</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Faisal</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sontag</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Doshi-Velez</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Celi</surname>
              <given-names>LA</given-names>
            </name>
          </person-group>
          <article-title>Guidelines for reinforcement learning in healthcare</article-title>
          <source>Nat Med</source>
          <year>2019</year>
          <volume>25</volume>
          <issue>1</issue>
          <fpage>16</fpage>
          <lpage>18</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://hdl.handle.net/10044/1/65646"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41591-018-0310-5</pub-id>
          <pub-id pub-id-type="medline">30617332</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41591-018-0310-5</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
