<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v26i1e54616</article-id>
      <article-id pub-id-type="pmid">39178403</article-id>
      <article-id pub-id-type="doi">10.2196/54616</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>AI-Driven Diagnostic Assistance in Medical Inquiry: Reinforcement Learning Algorithm Development and Validation</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Ma</surname>
            <given-names>Simone</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Lee</surname>
            <given-names>Hyeonhoon</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Tillmann</surname>
            <given-names>Taavi</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Zou</surname>
            <given-names>Xuan</given-names>
          </name>
          <degrees>MM</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0001-9018-002X</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>He</surname>
            <given-names>Weijie</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5523-1039</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Huang</surname>
            <given-names>Yu</given-names>
          </name>
          <degrees>ME</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5465-4574</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Ouyang</surname>
            <given-names>Yi</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5987-451X</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>Zhen</given-names>
          </name>
          <degrees>MM</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0007-6716-9053</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Wu</surname>
            <given-names>Yu</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0453-5662</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Wu</surname>
            <given-names>Yongsheng</given-names>
          </name>
          <degrees>BMed</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0009-1390-6585</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Feng</surname>
            <given-names>Lili</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff6" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7166-2867</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author">
          <name name-style="western">
            <surname>Wu</surname>
            <given-names>Sheng</given-names>
          </name>
          <degrees>BMed</degrees>
          <xref rid="aff6" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0362-9894</ext-link>
        </contrib>
        <contrib id="contrib10" contrib-type="author">
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>Mengqi</given-names>
          </name>
          <degrees>BE</degrees>
          <xref rid="aff7" ref-type="aff">7</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0005-8228-4565</ext-link>
        </contrib>
        <contrib id="contrib11" contrib-type="author">
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>Xuyan</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff6" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6468-3611</ext-link>
        </contrib>
        <contrib id="contrib12" contrib-type="author">
          <name name-style="western">
            <surname>Zheng</surname>
            <given-names>Yefeng</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2195-2847</ext-link>
        </contrib>
        <contrib id="contrib13" contrib-type="author">
          <name name-style="western">
            <surname>Jiang</surname>
            <given-names>Rui</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <xref rid="aff8" ref-type="aff">8</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7533-3753</ext-link>
        </contrib>
        <contrib id="contrib14" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>Ting</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <address>
            <institution>Department of Computer Science and Technology</institution>
            <institution>Tsinghua University</institution>
            <addr-line>Room 3-609, Future Internet Technology Research Center</addr-line>
            <addr-line>Tsinghua University</addr-line>
            <addr-line>Beijing, 100084</addr-line>
            <country>China</country>
            <phone>86 010 62797101</phone>
            <email>tingchen@tsinghua.edu.cn</email>
          </address>
          <xref rid="aff3" ref-type="aff">3</xref>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-3228-9166</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Shenzhen Center for Disease Control and Prevention</institution>
        <addr-line>Shenzhen</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Computer Science and Technology</institution>
        <institution>Tsinghua University</institution>
        <addr-line>Beijing</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Institute of Artificial Intelligence</institution>
        <institution>Tsinghua University</institution>
        <addr-line>Beijing</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Beijing National Research Center for Information Science and Technology</institution>
        <institution>Tsinghua University</institution>
        <addr-line>Beijing</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Jarvis Research Center</institution>
        <institution>Tencent YouTu Lab</institution>
        <addr-line>Shenzhen</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff6">
        <label>6</label>
        <institution>Beijing Tsinghua Changgung Hospital</institution>
        <institution>School of Clinical Medicine</institution>
        <institution>Tsinghua University</institution>
        <addr-line>Beijing</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff7">
        <label>7</label>
        <institution>Tencent Healthcare</institution>
        <addr-line>Shenzhen</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff8">
        <label>8</label>
        <institution>Department of Automation</institution>
        <institution>Tsinghua University</institution>
        <addr-line>Beijing</addr-line>
        <country>China</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Ting Chen <email>tingchen@tsinghua.edu.cn</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2024</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>23</day>
        <month>8</month>
        <year>2024</year>
      </pub-date>
      <volume>26</volume>
      <elocation-id>e54616</elocation-id>
      <history>
        <date date-type="received">
          <day>17</day>
          <month>11</month>
          <year>2023</year>
        </date>
        <date date-type="rev-request">
          <day>14</day>
          <month>3</month>
          <year>2024</year>
        </date>
        <date date-type="rev-recd">
          <day>13</day>
          <month>4</month>
          <year>2024</year>
        </date>
        <date date-type="accepted">
          <day>4</day>
          <month>7</month>
          <year>2024</year>
        </date>
      </history>
      <copyright-statement>©Xuan Zou, Weijie He, Yu Huang, Yi Ouyang, Zhen Zhang, Yu Wu, Yongsheng Wu, Lili Feng, Sheng Wu, Mengqi Yang, Xuyan Chen, Yefeng Zheng, Rui Jiang, Ting Chen. Originally published in the Journal of Medical Internet Research (https://www.jmir.org), 23.08.2024.</copyright-statement>
      <copyright-year>2024</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research (ISSN 1438-8871), is properly cited. The complete bibliographic information, a link to the original publication on https://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2024/1/e54616" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>For medical diagnosis, clinicians typically begin with a patient’s chief concerns, followed by questions about symptoms and medical history, physical examinations, and requests for necessary auxiliary examinations to gather comprehensive medical information. This complex medical investigation process has yet to be modeled by existing artificial intelligence (AI) methodologies.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>The aim of this study was to develop an AI-driven medical inquiry assistant for clinical diagnosis that provides inquiry recommendations by simulating clinicians’ medical investigating logic via reinforcement learning.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We compiled multicenter, deidentified outpatient electronic health records from 76 hospitals in Shenzhen, China, spanning the period from July to November 2021. These records consisted of both unstructured textual information and structured laboratory test results. We first performed feature extraction and standardization using natural language processing techniques and then used a reinforcement learning actor-critic framework to explore the rational and effective inquiry logic. To align the inquiry process with actual clinical practice, we segmented the inquiry into 4 stages: inquiring about symptoms and medical history, conducting physical examinations, requesting auxiliary examinations, and terminating the inquiry with a diagnosis. External validation was conducted to validate the inquiry logic of the AI model.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>This study focused on 2 retrospective inquiry-and-diagnosis tasks in the emergency and pediatrics departments. The emergency departments provided records of 339,020 consultations including mainly children (median age 5.2, IQR 2.6-26.1 years) with various types of upper respiratory tract infections (250,638/339,020, 73.93%). The pediatrics department provided records of 561,659 consultations, mainly of children (median age 3.8, IQR 2.0-5.7 years) with various types of upper respiratory tract infections (498,408/561,659, 88.73%). When conducting its own inquiries in both scenarios, the AI model demonstrated high diagnostic performance, with areas under the receiver operating characteristic curve of 0.955 (95% CI 0.953-0.956) and 0.943 (95% CI 0.941-0.944), respectively. When the AI model was used in a simulated collaboration with physicians, it notably reduced the average number of physicians’ inquiries to 46% (6.037/13.26; 95% CI 6.009-6.064) and 43% (6.245/14.364; 95% CI 6.225-6.269) while achieving areas under the receiver operating characteristic curve of 0.972 (95% CI 0.970-0.973) and 0.968 (95% CI 0.967-0.969) in the scenarios. External validation revealed a normalized Kendall τ distance of 0.323 (95% CI 0.301-0.346), indicating the inquiry consistency of the AI model with physicians.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>This retrospective analysis of predominantly respiratory pediatric presentations in emergency and pediatrics departments demonstrated that an AI-driven diagnostic assistant had high diagnostic performance both in stand-alone use and in simulated collaboration with clinicians. Its investigation process was found to be consistent with the clinicians’ medical investigation logic. These findings highlight the diagnostic assistant’s promise in assisting the decision-making processes of health care professionals.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>inquiry and diagnosis</kwd>
        <kwd>electronic health record</kwd>
        <kwd>reinforcement learning</kwd>
        <kwd>natural language processing</kwd>
        <kwd>artificial intelligence</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>The growing demand for intelligent clinical decision support systems (CDSSs) has become increasingly evident in the health care landscape today [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. The surge in demand can be attributed to advances in medical knowledge, the accumulation of health care data, and the rapid progression of artificial intelligence (AI) and machine learning technologies. Traditionally, health care professionals have relied heavily on their individual experiences and medical expertise to make clinical decisions, which are often susceptible to subjective biases and information gaps [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref4">4</xref>]. Furthermore, the world faces challenges related to insufficient medical resources, particularly in regions where a shortage of health care professionals impedes timely access to care. Consequently, intelligent CDSSs have been developed with the potential to enhance patient care quality, reduce medical costs, and minimize diagnostic errors. These systems were developed by analyzing and training data from electronic health records (EHRs) and medical literature [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref6">6</xref>] using the power of extensive data analysis, machine learning algorithms, and natural language processing techniques.</p>
        <p>Our research is focused on advancing CDSSs with a primary emphasis on aiding the diagnostic process before the diagnosis is made, specifically during the information-gathering phase. Existing diagnostic support systems often rely on comprehensive patient information, such as EHRs and medical images [<xref ref-type="bibr" rid="ref7">7</xref>-<xref ref-type="bibr" rid="ref13">13</xref>], to provide diagnostic predictions only at the final step of the medical investigation process. Thus, the vital need for decision support during the intermediate steps of the diagnostic process is largely overlooked. The clinical diagnostic process is a complex procedure that involves a series of inquiries and examinations. In this dynamic process, health care professionals continuously gather information, adjust hypotheses, and refine diagnostic reasoning until the optimal diagnosis and treatment are determined. The process is not merely a sequence of isolated steps but a dynamic and evolving interaction between the clinician and the patient. Conventional diagnostic support systems tend to provide little to no guidance during these intermediate steps, falling short of providing meaningful support when it is most needed.</p>
        <p>A variety of automatic disease diagnosis techniques have emerged recently as a result of the advancement of AI with the goal of assisting in the middle stages of clinical decision-making [<xref ref-type="bibr" rid="ref14">14</xref>-<xref ref-type="bibr" rid="ref21">21</xref>]. However, a common limitation among these methods is their exclusive focus on online disease diagnosis. Online health care platforms have undoubtedly revolutionized medical consultations by facilitating remote access to health care professionals. Patients can seek advice and preliminary assessments for various ailments without visiting a health care facility physically. Unfortunately, there are inherent constraints to these platforms. Online consultations are primarily reliant on textual descriptions, making it challenging to gather essential information that requires palpation, auscultation, or specialized laboratory investigations, which collectively form the foundation of a comprehensive and accurate diagnosis.</p>
        <p>Large language models (LLMs) such as ChatGPT [<xref ref-type="bibr" rid="ref22">22</xref>] have demonstrated remarkable proficiency in following instructions and generating humanlike responses across various domains. LLMs have already attracted a lot of attention regarding their potential applications in health care settings, which include facilitating clinical documentation, summarizing research papers, assisting with medical education [<xref ref-type="bibr" rid="ref23">23</xref>], or acting as a chatbot to respond to questions from patients about their specific concerns [<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref25">25</xref>]. While LLMs have access to extremely large corpora containing medical dialogues, knowledge bases, and the literature, there is a significant gap in access to large-scale real patient records [<xref ref-type="bibr" rid="ref26">26</xref>]. This lack of actual clinical data significantly impacts their ability to provide tailored inquiry recommendations for patients in varying clinical scenarios. In addition, ethical [<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref25">25</xref>] and security [<xref ref-type="bibr" rid="ref27">27</xref>] concerns further complicate the incorporation of sensitive health records into the training of LLMs.</p>
      </sec>
      <sec>
        <title>Objectives</title>
        <p>To address the gap in diagnostic decision support, we present MedRIA, a medical reinforcement learning inquiry assistant. MedRIA is designed to facilitate the medical investigation process by intelligently guiding inquiries; symptom assessments; examination recommendations; and, in particular, the transitions between them. To the best of our knowledge, no previous system has successfully managed the entire diagnostic process. MedRIA learns its inquiry capabilities from a large number of processed EHRs. MedRIA uses a reinforcement learning actor-critic framework [<xref ref-type="bibr" rid="ref28">28</xref>] to explore rational and effective inquiry logic. Following the standard inquiry process of physicians [<xref ref-type="bibr" rid="ref29">29</xref>], we segmented the inquiry into 4 stages: inquiring about symptoms and medical history, conducting physical examinations (PEs), requesting auxiliary examinations (AEs), and terminating the inquiry with a diagnosis. MedRIA’s ability to tailor inquiry strategies according to patient-specific conditions positions it as a promising solution for regions or populations facing constraints in medical resources.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Processed Outpatient EHRs</title>
        <p>The Shenzhen Center for Disease Control and Prevention in Guangdong Province, China, collected deidentified outpatient EHRs from 76 hospitals in Shenzhen. We selected records of the emergency and pediatrics departments from July 2021 to November 2021. As depicted in <xref rid="figure1" ref-type="fig">Figure 1</xref>, these records consist of both unstructured textual information and structured laboratory test results, which underwent feature extraction and standardization using natural language processing techniques. An example of a processed EHR is provided on the right side of <xref rid="figure1" ref-type="fig">Figure 1</xref>.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Schematic illustration of the data collection, data processing, and task building process for the development of MedRIA. ADHD: attention-deficit/hyperactivity disorder; EHR: electronic health record.</p>
          </caption>
          <graphic xlink:href="jmir_v26i1e54616_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>By combining established medical terminologies with domain-specific knowledge from health care professionals, we constructed a comprehensive feature set for the feature extraction process. Initially, we used existing Chinese versions of general medical terminologies, including the <italic>International Classification of Diseases, 10th Revision</italic>, and Systematized Nomenclature of Medicine–Clinical Terms. In addition, we incorporated domain expertise by consulting with health care experts to identify relevant clinical concepts and terminology to the context of our study. The feature sets of the emergency and pediatrics EHRs are presented in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendices 1</xref> and <xref ref-type="supplementary-material" rid="app2">2</xref>, respectively.</p>
        <p>As depicted in <xref rid="figure1" ref-type="fig">Figure 1</xref>, after extracting features from clinical text and standardizing test forms, each record was converted into a feature set, where each feature was categorized into 1 of 3 types based on its source—symptom and medical history (SMH), PE, and AE—and assigned a value based on its data type. Symptom features (eg, <italic>cough</italic>) and some features observed from examinations (eg, <italic>throat congestion</italic> and <italic>proteinuria</italic>) were assigned binary values indicating whether the patient exhibited that feature. Numerical laboratory test features with specific reference ranges, such as <italic>platelet count</italic>, were categorized as high, low, or within the reference range. The values of descriptive features depend on their meanings. For example, <italic>urine color</italic> was given values such as <italic>yellow</italic>, <italic>colorless</italic>, <italic>white</italic>, <italic>red</italic>, and so on.</p>
        <p>In our study, we used the Medical Bidirectional Encoder Representations From Transformers (MedBERT) model for feature extraction on clinical text, which was based on Bidirectional Encoder Representations From Transformers [<xref ref-type="bibr" rid="ref30">30</xref>]. Using a vast corpus of Chinese clinical text data, including medical textbooks, online consultations, journal article abstracts, and deidentified EHRs, we pretrained the Bidirectional Encoder Representations From Transformers model to obtain MedBERT. We manually constructed 2 labeled data sets to fine-tune MedBERT to perform medical named entity recognition and entity normalization. In our pipeline, we first used fine-tuned MedBERT for medical named entity recognition on clinical text. Next, we proceeded to normalize the identified entities to our predefined feature set using the fine-tuned MedBERT for entity normalization. Finally, we used a string-matching negation detection mechanism to determine the values of binary features based on the contents of the text. For structured laboratory test results, we used a string-matching algorithm to standardize the test items to our predefined feature set. The feature values could be directly obtained from the structured results.</p>
        <p>Following the feature extraction process, we conducted data cleaning and filtering. Details are presented in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref> [<xref ref-type="bibr" rid="ref31">31</xref>-<xref ref-type="bibr" rid="ref37">37</xref>]. Finally, we filtered the data sets by department, creating 2 retrospective inquiry-and-diagnosis evaluation tasks for emergency and pediatrics. Emergency and pediatrics are the 2 busiest departments in hospitals and often put tremendous pressure on health care personnel. These departments require effective decision support tools to assist health care professionals in managing the workload efficiently while providing timely and accurate patient care.</p>
      </sec>
      <sec>
        <title>Reinforcement Learning Formulation</title>
        <p>MedRIA takes as initial input the patient’s basic demographic information, including gender and age, along with features extracted from the patient’s chief concerns. Subsequently, MedRIA provides recommendations for the physician to inquire about specific features. As the physician conducts the inquiry and gathers patient information, MedRIA updates the patient’s status and continues to output the next relevant feature or suggests terminating the inquiry and providing a predicted diagnosis in terms of the probability distribution over potential disease diagnoses. This can be described as a Markov decision process [<xref ref-type="bibr" rid="ref38">38</xref>], represented by the tuple <italic>M</italic>(<italic>S</italic>, <italic>A</italic>, <italic>T</italic>, <italic>R</italic>, <italic>γ</italic>). Here, <italic>S</italic> (state) is a set of vectors representing the inquiry states that incorporate both observed and unobserved features so far, denoted as x<sub>O</sub> and x<sub>U</sub>, respectively. <italic>A</italic> (action) involves the actions available to MedRIA, including recommending specific features or suggesting the termination of the inquiry process. The goal is to determine the optimal inquiry strategy composed of a series of actions, denoted as π<sub>θ</sub>. At each step t, the policy π<sub>θ</sub>(a<sub>t</sub>&#124;s<sub>t</sub>) determines the action a<sub>t</sub> based on the current state s<sub>t</sub>. The transition function <italic>T</italic> represents the probability distribution of the next state s<sub>t+1</sub> given the current state s<sub>t</sub> and action a<sub>t</sub>, denoted as p(s<sub>t+1</sub>&#124;s<sub>t</sub>, a<sub>t</sub>). <italic>R</italic> is a reward function used to assess the benefit of the transition (s<sub>t</sub>, a<sub>t</sub>, s<sub>t+1</sub>). <italic>γ</italic> is the discount factor for accumulating rewards at each step. The state-value function that reinforcement learning maximizes is the expected sum of discounted rewards given the policy π<sub>θ</sub> and the state s<sub>t</sub>.</p>
      </sec>
      <sec>
        <title>Actor-Critic Framework</title>
        <p>MedRIA uses the classic reinforcement learning actor-critic framework [<xref ref-type="bibr" rid="ref28">28</xref>] involving 2 neural networks: the actor and the critic. The actor network determines the next action to take, whereas the critic network is responsible for providing feedback to the actor, evaluating the quality of actions and suggesting adjustments. On the basis of our previous work [<xref ref-type="bibr" rid="ref39">39</xref>], we used a pretrained variational autoencoder (VAE) [<xref ref-type="bibr" rid="ref31">31</xref>] as the backbone of the actor network. We used a supervised diagnostic prediction model, denoted as <italic>D</italic>, to provide the current disease prediction probability distribution <italic>D</italic>(s<sub>t</sub>) based on the state s<sub>t</sub> to help decide on each inquiry action.</p>
        <p>The actor of MedRIA makes decisions for the next action based on the observed features x<sub>O</sub>. It is intuitive to prioritize asking about feature x that has a high conditional probability p(x&#124;x<sub>O</sub>). We leveraged the VAE to incorporate the conditional probability distribution between observed features x<sub>O</sub> and unobserved features x<sub>U</sub>. A VAE defines a generative model of the form p(x, z)=∏<sub>i</sub> p<sub>Θ</sub>(x<sub>i</sub>&#124;z)p(z), where features x are generated from latent variables z. The number of dimensions of z is 64. p(z) represents a prior, often a spherical Gaussian distribution. p<sub>Θ</sub>(x&#124;z) is represented by a 4-layer multilayer perceptron (MLP) decoder with parameters Θ. The VAE uses another neural network encoder with parameters Φ to generate the variational approximation of the posterior q<sub>Φ</sub>(z&#124;x). To obtain p(x<sub>U</sub>&#124;x<sub>O</sub>), we sampled ẑ from the VAE encoder as ẑ~q<sub>Φ</sub>(z&#124;x) and then sampled x<sub>U</sub> from the VAE decoder as p<sub>Θ</sub>(x<sub>U</sub>&#124;ẑ). Let e<sub>i</sub> represent the embedding vector for the ith observed feature x<sub>i</sub>, and let c<sub>i</sub>=[x<sub>i</sub>, e<sub>i</sub>] denote the concatenated input carrying information for x<sub>i</sub>. The number of dimensions of e<sub>i</sub> is 64. Then, we used a 4-layer MLP to map the input c<sub>i</sub> to a Gaussian distribution in latent space, with mean vector μ<sub>i</sub> and variance vector V<sub>i</sub>. To address arbitrary partial observations of features during the inquiry process, we used a product-of-experts mechanism [<xref ref-type="bibr" rid="ref40">40</xref>] to calculate the approximate posterior. The VAE was incorporated within the actor network to leverage the conditional probability distribution p(x<sub>U</sub>&#124;x<sub>O</sub>). To obtain the action a<sub>t</sub>, x<sub>O</sub> were first fed into the nested VAE, yielding decoded features that contain predictive information regarding x<sub>U</sub>. The decoded features were then concatenated with the current diagnostic confidence <italic>D</italic>(s<sub>t</sub>) and the representation of the current timestep n<sub>t</sub>. Here, n<sub>t</sub>=t / N<sub>T</sub> represents the ratio of the number of completed inquiries t over a predefined maximum action count N<sub>T</sub>. N<sub>T</sub> was set to 21 and 26 for the emergency and pediatrics tasks, respectively. Finally, a 2-layer MLP with softmax activation was used to map the concatenated vector to the action space.</p>
        <p>The objective of the critic is to estimate the state-value function to optimize the policy π<sub>θ</sub>. Similar to the approach used in the actor, we concatenated the current state s<sub>t</sub> with <italic>D</italic>(s<sub>t</sub>) and n<sub>t</sub> to form an input vector to aid in estimation. In addition, we obtained the informative latent variable z<sub>t</sub> by feeding observed features x<sub>O</sub> into the VAE encoder and appended z<sub>t</sub> to the input vector. Ultimately, a 5-layer MLP was used to map the input vector to predict the state value.</p>
      </sec>
      <sec>
        <title>Reward Shaping</title>
        <p>The reward function for evaluating the gain in state transition plays a crucial role in the reinforcement learning process. We start by defining the short-term reward function <italic>R</italic><sub>short</sub> when the action is to inquire about a specific feature x. For MedRIA, the inquiry states can be categorized into 4 ordered stages: SMH (S<sub>SMH</sub>), PE (S<sub>PE</sub>), AE (S<sub>AE</sub>), and termination with diagnosis (S<sub>TD</sub>). During the inquiry process, there can be multiple states that fall under each stage. For example, the initial state of MedRIA falls under S<sub>SMH</sub>, followed by a sequence of states that fall under S<sub>PE</sub>, and so on. Correspondingly, all features are categorized according to the 3 inquiry stages S<sub>SMH</sub>, S<sub>PE</sub>, and S<sub>AE</sub>. When MedRIA selects a feature that falls under a particular inquiry stage, it signifies a transition from the inquiry stage to that stage. We ensure that MedRIA’s inquiry process adheres to the sequential nature of clinical inquiries, where features from previous stages are not considered for selection once the inquiry progresses to a subsequent stage. This is achieved by manually setting the probabilities of actions associated with features from previous stages to 0 in the action probability distribution of the actor.</p>
        <p>To measure the consistency of MedRIA’s inquiries with those made by physicians, we introduce 3 functions: M<sub>SMH</sub>(s<sub>t</sub>), M<sub>PE</sub>(s<sub>t</sub>), and M<sub>AE</sub>(s<sub>t</sub>). These functions quantify the number of features that physicians have inquired about in the current state s<sub>t</sub> but that MedRIA has not investigated. Specifically, M<sub>SMH</sub>(s<sub>t</sub>), M<sub>PE</sub>(s<sub>t</sub>), and M<sub>AE</sub>(s<sub>t</sub>) quantify the number of SMH features, PE features, and AE features, respectively. When calculating M<sub>AE</sub>(s<sub>t</sub>), all features within a laboratory test are considered as a unit. Essentially, M<sub>AE</sub>(s<sub>t</sub>) calculates the number of AEs that physicians have recommended in the current state s<sub>t</sub> but that MedRIA has omitted. Correspondingly, when MedRIA selects a feature associated with an AE, it indicates that MedRIA has recommended the entire examination.</p>
        <p>To assess the diagnostic quality of inquiries, we define a function Diff(s<sub>t</sub>, x, s<sub>t+1</sub>) to estimate the differential effect of querying the feature x in the transition from state s<sub>t</sub> to state s<sub>t+1</sub>. If x belongs to the extracted features, meaning that the physician also inquired about that feature from the patient, then Diff(s<sub>t</sub>, x, s<sub>t+1</sub>) is defined as Diff(s<sub>t</sub>, x, s<sub>t+1</sub>)=&#124;D<sub>KL</sub>[y&#124;&#124;<italic>D</italic>(s<sub>t</sub>)]-D<sub>KL</sub>[y&#124;&#124;<italic>D</italic>(s<sub>t+1</sub>)]&#124;, where D<sub>KL</sub> is the Kullback-Leibler divergence between 2 distributions and y is a one-hot vector indicating the final diagnosis made by the physician. The absolute difference between these 2 Kullback-Leibler divergences represents the degree to which the feature x influences the diagnosis results, with the final diagnosis made by the physician as the reference. If x does not belong to the extracted features, then Diff(s<sub>t</sub>, x, s<sub>t+1</sub>) is simply set to 0. Subsequently, we define the short-term reward function <italic>R</italic><sub>short</sub>(s<sub>t</sub>, x, s<sub>t+1</sub>) as follows: when s<sub>t</sub> belongs to S<sub>SMH</sub> and s<sub>t+1</sub> belongs to S<sub>PE</sub>, <italic>R</italic><sub>short</sub>(s<sub>t</sub>, x, s<sub>t+1</sub>)=Diff(s<sub>t</sub>, x, s<sub>t+1</sub>)+α·I<sub>phy</sub>(x)-m·M<sub>SMH</sub>(s<sub>t</sub>); when s<sub>t</sub> belongs to S<sub>SMH</sub> and s<sub>t+1</sub> belongs to S<sub>AE</sub>, <italic>R</italic><sub>short</sub>(s<sub>t</sub>, x, s<sub>t+1</sub>)=Diff(s<sub>t</sub>, x, s<sub>t+1</sub>)+α·I<sub>phy</sub>(x)-m·(M<sub>SMH</sub>(s<sub>t</sub>)+M<sub>PE</sub>(s<sub>t</sub>)); when s<sub>t</sub> belongs to S<sub>PE</sub> and s<sub>t+1</sub> belongs to S<sub>AE,</sub> <italic>R</italic><sub>short</sub>(s<sub>t</sub>, x, s<sub>t+1</sub>)=Diff(s<sub>t</sub>, x, s<sub>t+1</sub>)+α·I<sub>phy</sub>(x)-m·M<sub>AE</sub>(s<sub>t</sub>); otherwise, <italic>R</italic><sub>short</sub>(s<sub>t</sub>, x, s<sub>t+1</sub>)=Diff(s<sub>t</sub>, x, s<sub>t+1</sub>)+α·I<sub>phy</sub>(x). I<sub>phy</sub>(x) is an indicator representing whether feature x belongs to the extracted features. If yes, it takes the value of 1; otherwise, it is 0. α and m are small constant factors to balance terms in the expression. We set α to 0.2. m was set to 0.2 in the emergency task and 0.3 in the pediatrics task. In <italic>R</italic><sub>short</sub>, we penalize each hasty stage transition based on the number of features that the actual physician inquired about from the patient in the previous stage but were not inquired about by MedRIA.</p>
        <p>Next, we elaborate on the definition of the long-term reward <italic>R</italic><sub>long</sub> for the action of terminating the inquiry. When MedRIA selects the action to stop the inquiry process, if the disease predicted by the diagnostic model <italic>D</italic> matches the physician’s diagnosis, <italic>R</italic><sub>long</sub> is set to 2 in the emergency task and 3 in the pediatrics task. If it does not match, similar to the penalty of inquiry consistency in <italic>R</italic><sub>short</sub>, we define <italic>R</italic><sub>long</sub>(s<sub>t</sub>, x, s<sub>t+1</sub>) as follows: when s<sub>t</sub> belongs to S<sub>SMH</sub>, <italic>R</italic><sub>long</sub>(s<sub>t</sub>, x, s<sub>t+1</sub>)=-m·(M<sub>SMH</sub>(s<sub>t</sub>)+M<sub>PE</sub>(s<sub>t</sub>)+M<sub>AE</sub>(s<sub>t</sub>)); when s<sub>t</sub> belongs to S<sub>PE</sub>, <italic>R</italic><sub>long</sub>(s<sub>t</sub>, x, s<sub>t+1</sub>)=-m·(M<sub>PE</sub>(s<sub>t</sub>)+M<sub>AE</sub>(s<sub>t</sub>)); when s<sub>t</sub> belongs to S<sub>AE</sub>, <italic>R</italic><sub>long</sub>(s<sub>t</sub>, x, s<sub>t+1</sub>)=-m·M<sub>AE</sub>(s<sub>t</sub>).</p>
      </sec>
      <sec>
        <title>Training Details</title>
        <p>During the training process of MedRIA, we first trained a VAE. In particular, we simulated the arbitrary partial observations during the inquiry process by randomly dropping a portion of input features. Next, we trained a diagnostic prediction model <italic>D</italic> based on a 5-layer MLP using the softmax function and cross-entropy loss function. Then, we initialized the parameters of the nested VAE in the actor network of MedRIA with the parameters of the trained VAE. Only the nested VAE decoder was fine-tuned in the follow-up training. We used the proximal policy optimization [<xref ref-type="bibr" rid="ref32">32</xref>] algorithm to train both the actor and critic networks. To make the predicted diagnostic probability distribution more accurate when dealing with the partially observed features generated by MedRIA, we collected the observed features x<sub>O</sub> when the actor chose to terminate the inquiry process during each training epoch. At the end of each epoch, collected data were used to fine-tune <italic>D</italic> to better adapt to MedRIA’s inquiry patterns. More details on implementation are presented in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>.</p>
      </sec>
      <sec>
        <title>External Validation</title>
        <p>We used data from the medical dialogue corpus, IMCS-21 [<xref ref-type="bibr" rid="ref41">41</xref>], to assess MedRIA’s inquiry logic. IMCS-21 contains 4116 online medical consultations between physicians and patients covering 10 pediatric diseases. After data filtering, we selected 950 consultations with clear diagnoses that overlapped with 4 diseases covered in our pediatrics task: bronchitis (286 consultations), acute upper respiratory tract infection (392 consultations), indigestion (233 consultations), and bronchopneumonia (39 consultations). This data set served as an external test set for the trained pediatric MedRIA. We constructed ordered inquiry sequences based on the dialogue contents. These inquiry sequences reflected the typical order of feature queries in the diagnostic process, and they were used to evaluate MedRIA’s inquiry sequences. If MedRIA’s inquiry sequences are similar to those of physicians, we can conclude that MedRIA’s inquiry logic is similar to that of physicians. The similarity is measured by the Kendall τ distance, which treats an inquiry sequence as a permutation of features and quantifies the pairwise disagreements between 2 permutations. In addition, we applied the normalized Kendall τ distance, which scales the Kendall τ distance by the total number of possible feature pairs.</p>
      </sec>
      <sec>
        <title>Statistical Analysis</title>
        <p>Nonparametric bootstrap sampling was used to calculate a 95% CI. Specifically, we repeatedly drew 1000 bootstrap samples from the test set. Each bootstrap sample was obtained through random sampling with replacement and has the same size as the test set.</p>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>All EHR data used in this study were retrospectively collected from EHR systems sourced from routine clinical practice. To ensure patient privacy and confidentiality, all data were deidentified. This study was approved by the ethics committees of the Shenzhen Center for Disease Control and Prevention (SZCDC-IRB2024055). As this study involved no direct patient intervention and was retrospective in nature, individual informed consent was waived.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Data Characteristics</title>
        <p>We focused on 2 retrospective inquiry-and-diagnosis evaluation tasks in the emergency and pediatrics departments. The emergency departments provided 339,020 records, and the pediatrics departments provided 561,659 records. We randomly split the data into 3 parts: 75% for training MedRIA, 10% for validation, and 15% for testing.</p>
        <p>The emergency EHRs contained 862 features, including 42.8% (369/862) SMH features, 21.2% (183/862) PE features, and 36% (310/862) AE features. There were 18 diagnosed diseases. As some records had 2 diagnosed diseases, we classified each combination as a separate disease category, bringing the total number of distinct diagnoses to 23. Similarly, the pediatrics EHRs covered 793 features, including 44.3% (351/793) SMH features, 22.6% (179/793) PE features, and 33.2% (263/793) AE features. There were 18 diagnosed diseases. When combinations of diagnosed diseases were considered, the total number of different diagnoses increased to 23. The detailed data characteristics are presented in <xref ref-type="table" rid="table1">Tables 1</xref> and <xref ref-type="table" rid="table2">2</xref>.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Characteristics of the data in the emergency task (N=339,020).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="660"/>
            <col width="310"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Characteristics</td>
                <td>Values</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="3">
                  <bold>Gender, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Male</td>
                <td>187,992 (55.5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Female</td>
                <td>151,028 (44.5)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Age (years), median (IQR)</td>
                <td>5.2 (2.6-26.1)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Diagnosis, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>AURTI<sup>a</sup></td>
                <td>93,594 (27.6)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Bronchitis</td>
                <td>93,564 (27.6)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Bronchitis with rhinitis</td>
                <td>2439 (0.7)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>AURTI with bronchitis</td>
                <td>4923 (1.5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Bronchopneumonia</td>
                <td>3833 (1.1)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Laryngopharyngitis</td>
                <td>6095 (1.8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Pharyngitis</td>
                <td>24,146 (7.1)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>AURTI with pharyngitis</td>
                <td>2639 (0.8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Pharyngitis with bronchitis</td>
                <td>3564 (1.1)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Herpangina</td>
                <td>7604 (2.2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Tonsillitis</td>
                <td>10,286 (3)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>AURTI with tonsillitis</td>
                <td>1784 (0.5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Gastroenteritis</td>
                <td>30,385 (9)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Gastritis</td>
                <td>10,142 (3)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Enteritis</td>
                <td>2690 (0.8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Acute appendicitis</td>
                <td>1957 (0.6)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Urinary tract stones</td>
                <td>13,884 (4.1)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Urethritis</td>
                <td>4052 (1.2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Dermatitis</td>
                <td>6239 (1.8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Acute urticaria</td>
                <td>5597 (1.7)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Hand-foot-and-mouth disease</td>
                <td>2990 (0.9)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Hypertension</td>
                <td>4397 (1.3)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Lumbar disc herniation</td>
                <td>2216 (0.7)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>AURTI: acute upper respiratory tract infection.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Characteristics of the data in the pediatrics task (N=561,659).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="670"/>
            <col width="300"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Characteristics</td>
                <td>Values</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="3">
                  <bold>Gender, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Male</td>
                <td>315,074 (56.1)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Female</td>
                <td>246,585 (43.9)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Age (years), median (IQR)</td>
                <td>3.8 (2.0-5.7)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Diagnosis, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Bronchitis</td>
                <td>209,918 (37.4)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>AURTI<sup>a</sup></td>
                <td>155,181 (27.6)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>AURTI with bronchitis</td>
                <td>11,734 (2.1)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Bronchopneumonia</td>
                <td>8119 (1.4)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Bronchitis with bronchopneumonia</td>
                <td>2565 (0.5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Pharyngitis</td>
                <td>41,205 (7.3)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Pharyngitis with bronchitis</td>
                <td>5232 (0.9)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>AURTI with pharyngitis</td>
                <td>2859 (0.5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Laryngopharyngitis</td>
                <td>11,909 (2.1)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Tonsillitis</td>
                <td>19,790 (3.5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Herpangina</td>
                <td>15,647 (2.8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Rhinitis</td>
                <td>14,824 (2.6)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Bronchitis with rhinitis</td>
                <td>10,109 (1.8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Gastroenteritis</td>
                <td>16,261 (2.9)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Gastritis</td>
                <td>5313 (0.9)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Enteritis</td>
                <td>3479 (0.6)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Indigestion</td>
                <td>8757 (1.6)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Hand-foot-and-mouth disease</td>
                <td>5156 (0.9)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Dermatitis</td>
                <td>3151 (0.6)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Acute urticaria</td>
                <td>2595 (0.5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Developmental delay</td>
                <td>2953 (0.5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Hyperactivity</td>
                <td>2538 (0.5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Precocious puberty</td>
                <td>2364 (0.4)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>AURTI: acute upper respiratory tract infection.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Evaluation Criteria</title>
        <p>We assessed the inquiry performance of MedRIA along 2 dimensions: the consistency of its inquiries with those of physicians and the contribution of its inquiries to diagnostic accuracy. It should be noted that physicians will inevitably make incorrect diagnoses, conduct inquiries based on individual previous experience, and record the EHRs in different ways. Therefore, we can establish a baseline diagnostic model by training a supervised classification model using the extracted feature sets as input and the physicians’ diagnoses as output. This model simulated the physicians’ diagnostic ability, and its performance approximates the actual performance of physicians. We aimed to mitigate the influence of individual physician variability and ensure a fair comparison between different inquiry methods based on the extracted feature sets. While the diagnoses in the records could serve as a gold standard, our simulated physician diagnostic model also serves as an important baseline. For training, several machine learning models were used, including logistic regression, random forest, support vector machine, MLP, and light gradient-boosting machine [<xref ref-type="bibr" rid="ref42">42</xref>]. We chose light gradient-boosting machine for the emergency task and random forest for the pediatrics task based on their performance on the validation set.</p>
        <p>To better evaluate the potential of MedRIA as a clinical assistant, we simulated a collaborative inquiry process between MedRIA and a physician. Specifically, MedRIA’s actor network would generate probability distributions for potential inquiry features based on the currently collected medical information. These distributions suggest several high-probability features for the physician to inquire about. The physician has the flexibility to accept and incorporate some or all of these suggestions into the inquiries. In addition, the physician can exercise their professional judgment to either ask additional questions or proceed to examination. In our simulated collaboration, we simplified this process by having MedRIA recommend only the feature with the highest probability at each step. If the inquiry features suggested by MedRIA were in agreement with part of the extracted feature set, it was assumed that the physician accepted the inquiry recommendations. Otherwise, if the suggested features were not found in the extracted feature set, the simulated physician would randomly select an unasked feature from the extracted features as the next inquiry question. This simplification represents a simplistic approximation of a less informed or junior physician’s behavior. It serves as a conservative estimate of MedRIA’s performance when collaborating with less experienced counterparts, reflecting a lower-bound performance of MedRIA-physician collaborative inquiry. <xref rid="figure2" ref-type="fig">Figure 2</xref> illustrates a vivid example of the simulated collaborative inquiry process.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Schematic illustration of the simulated collaborative inquiry process between a physician and MedRIA. AI: artificial intelligence.</p>
          </caption>
          <graphic xlink:href="jmir_v26i1e54616_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Inquiry Quality Analysis</title>
        <p><xref ref-type="table" rid="table3">Table 3</xref> illustrates the performance of MedRIA in the emergency and pediatrics tasks in terms of diagnosis accuracy and inquiry consistency. In the emergency task, physicians used an average of 13.26 (95% CI 13.202-13.317) inquiries to gather 19.488 (95% CI 19.361-19.618) features. This disparity in numbers is because a single inquiry related to a specific laboratory test can yield multiple features. For example, a complete blood count includes several features, such as lymphocyte percentage, platelet count, hemoglobin concentration, and so on. When MedRIA conducted its own inquiries, it averaged 14.24 (95% CI 14.2-14.284) inquiries, with 58% (8.253/14.24; 95% CI 8.212-8.297) of them matching the extracted features. It resulted in the acquisition of an average of 10.628 (95% CI 10.549-10.714) features, accounting for 55% (10.628/19.488) of all extracted features. In the pediatrics task, MedRIA performed, on average, 1.9 more inquiries (16.271, 95% CI 16.231-16.307) than physicians (14.364, 95% CI 14.322-14.404), with 60% (9.81/16.271; 95% CI 9.776-9.842) of them matching 64% (13.168/20.429; 95% CI 13.093-13.244) of all extracted features (20.429, 95% CI 20.338-20.513). When MedRIA collaborated with physicians, it recalled 95% (18.543/19.488; 95% CI 18.425-18.657) and 99% (20.168/20.429; 95% CI 20.080-20.251) of the extracted features in the emergency and pediatrics tasks, respectively. The simulated collaborative inquiry process required only an average of 12.648 (95% CI 12.602-12.696) and 14.146 (95% CI 14.106-14.182) inquiries, respectively, for the emergency and pediatrics tasks, both fewer than the number of inquiries made by physicians. With the assistance of MedRIA, we were able to reduce the number of inquiries made by physicians to 46% (6.037/13.26; 95% CI 6.009-6.064) and 43% (6.245/14.364; 95% CI 6.225-6.269) of those in independent inquiries while recovering nearly all the original inquiry records.</p>
        <p>We used multiple metrics to assess final diagnoses, including the area under the receiver operating characteristic curve (AUROC), macro–<italic>F</italic><sub>1</sub>-score, and accuracy. We also introduced a new metric called general accuracy, which considers both fully and partially correct diagnoses in accuracy calculation because health care professionals from different hospitals may have varying recording habits. A diagnosis was considered fully correct when the core diagnosis was recorded and partially correct when only a constituent element of the core diagnosis was recorded [<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref44">44</xref>]. As shown in <xref ref-type="table" rid="table3">Table 3</xref>, when MedRIA conducted its own inquiries in the emergency task, it achieved an AUROC (0.955, 95% CI 0.953-0.956) comparable to when it acquired complete extracted features (0.960, 95% CI 0.957-0.962) despite obtaining only 55% (10.628/19.488) of the extracted features. In the pediatrics task, MedRIA achieved a higher AUROC (0.943, 95% CI 0.941-0.944) with 64% (13.168/20.429) of the extracted features compared to using complete features (0.930, 95% CI 0.928-0.932). As shown in <xref rid="figure3" ref-type="fig">Figure 3</xref>, MedRIA’s own inquiry and the collaborative inquiry in the emergency task significantly improved the AUROC of diagnostic predictions for acute appendicitis. Specifically, when compared to physicians’ inquiry, both MedRIA’s own inquiry and the collaborative inquiry demonstrated substantially lower false negative rates (equal to 1 minus true positive rates) at various false positive rate thresholds. These findings underscore the potential of MedRIA to significantly reduce diagnostic errors, particularly for critical conditions such as acute appendicitis in which even small increases in false negative rates may be unacceptable to patients and health system leaders.</p>
        <p>The collaborative inquiry and the physicians’ inquiry resulted in similar AUROCs for acute upper respiratory tract infections and bronchopneumonia. As shown in <xref rid="figure4" ref-type="fig">Figure 4</xref>, MedRIA’s own inquiry resulted in a higher AUROC for rhinitis than the physicians’ inquiry in the pediatrics task but a lower AUROC for bronchitis and bronchopneumonia. For these 3 diseases, the collaborative inquiry yielded the highest AUROC. The complete receiver operating characteristic curves for all diseases are shown in Figures S1 and S2 in <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>. These results demonstrate that MedRIA understands the importance of inquiring about discriminative features that have a high diagnostic contribution, especially in the pediatrics task.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Performance of MedRIA in the emergency and pediatrics tasks.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="120"/>
            <col width="0"/>
            <col width="100"/>
            <col width="0"/>
            <col width="80"/>
            <col width="0"/>
            <col width="90"/>
            <col width="0"/>
            <col width="90"/>
            <col width="0"/>
            <col width="110"/>
            <col width="0"/>
            <col width="140"/>
            <col width="0"/>
            <col width="130"/>
            <col width="0"/>
            <col width="110"/>
            <thead>
              <tr valign="top">
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="2">AUROC<sup>a</sup> (95% CI)</td>
                <td colspan="2"><italic>F</italic><sub>1</sub>-score (95% CI)</td>
                <td colspan="2">General accuracy (95% CI)</td>
                <td colspan="2">Accuracy (95% CI)</td>
                <td colspan="2">Average number of inquiries (95% CI)</td>
                <td colspan="2">Average number of inquiries matching extracted features (95% CI)</td>
                <td colspan="2">Average number of inquiries conducted by physicians (95% CI)</td>
                <td>Average number of recalled features (95% CI)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="18">
                  <bold>Emergency</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Physicians</td>
                <td colspan="2">0.96 (0.957-0.962)</td>
                <td colspan="2">0.63 (0.623-0.638)</td>
                <td colspan="2">0.853 (0.85-0.856)</td>
                <td colspan="2">0.744 (0.741-0.748)</td>
                <td colspan="2">13.26 (13.202-13.317)</td>
                <td colspan="2">13.26 (13.202-13.317)</td>
                <td colspan="2">13.26 (13.202-13.317)</td>
                <td colspan="2">19.488 (19.361-19.618)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>MedRIA</td>
                <td colspan="2">0.955 (0.953-0.956)</td>
                <td colspan="2">0.538 (0.531-0.545)</td>
                <td colspan="2">0.806 (0.803-0.81)</td>
                <td colspan="2">0.684 (0.68-0.688)</td>
                <td colspan="2">14.24 (14.2-14.284)</td>
                <td colspan="2">8.253 (8.212-8.297)</td>
                <td colspan="2">0</td>
                <td colspan="2">10.628 (10.549-10.714)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Collaboration</td>
                <td colspan="2">0.972 (0.97-0.973)</td>
                <td colspan="2">0.646 (0.639-0.653)</td>
                <td colspan="2">0.854 (0.851-0.857)</td>
                <td colspan="2">0.746 (0.742-0.75)</td>
                <td colspan="2">12.648 (12.602-12.696)</td>
                <td colspan="2">12.648 (12.602-12.696)</td>
                <td colspan="2">6.037 (6.009-6.064)</td>
                <td colspan="2">18.543 (18.425-18.657)</td>
              </tr>
              <tr valign="top">
                <td colspan="18">
                  <bold>Pediatrics</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Physicians</td>
                <td colspan="2">0.93 (0.928-0.932)</td>
                <td colspan="2">0.613 (0.608-0.618)</td>
                <td colspan="2">0.827 (0.825-0.83)</td>
                <td colspan="2">0.704 (0.701-0.708)</td>
                <td colspan="2">14.364 (14.322-14.404)</td>
                <td colspan="2">14.364 (14.322-14.404)</td>
                <td colspan="2">14.364 (14.322-14.404)</td>
                <td colspan="2">20.429 (20.338-20.513)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>MedRIA</td>
                <td colspan="2">0.943 (0.941-0.944)</td>
                <td colspan="2">0.521 (0.514-0.527)</td>
                <td colspan="2">0.782 (0.779-0.784)</td>
                <td colspan="2">0.656 (0.653-0.66)</td>
                <td colspan="2">16.271 (16.231-16.307)</td>
                <td colspan="2">9.81 (9.776-9.842)</td>
                <td colspan="2">0</td>
                <td colspan="2">13.168 (13.093-13.244)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Collaboration</td>
                <td colspan="2">0.968 (0.967-0.969)</td>
                <td colspan="2">0.633 (0.627-0.638)</td>
                <td colspan="2">0.842 (0.839-0.844)</td>
                <td colspan="2">0.732 (0.729-0.735)</td>
                <td colspan="2">14.146 (14.106-14.182)</td>
                <td colspan="2">14.146 (14.106-14.182)</td>
                <td colspan="2">6.245 (6.225-6.269)</td>
                <td colspan="2">20.168 (20.08-20.251)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>AUROC: area under the receiver operating characteristic curve.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Receiver operating characteristic curves for 3 diseases in the emergency task. AUC: area under the curve; AURTI: acute upper respiratory tract infection.</p>
          </caption>
          <graphic xlink:href="jmir_v26i1e54616_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Receiver operating characteristic curves for 3 diseases in the pediatrics task. AUC: area under the curve.</p>
          </caption>
          <graphic xlink:href="jmir_v26i1e54616_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>MedRIA may conduct inquiries that were not asked by physicians, so they are excluded from the extracted features of patient EHRs. Hence, when MedRIA conducted its own inquiries, there was a varying degree of decline in all diagnostic metrics when compared to using complete extracted features. On the other hand, MedRIA obtained more information through the guidance of physicians when it collaborated with them. In the emergency task, the <italic>F</italic><sub>1</sub>-score (0.646, 95% CI 0.639-0.653) of diagnoses significantly improved. Both general accuracy (0.854, 95% CI 0.851-0.857) and accuracy (0.746, 95% CI 0.742-0.750) were comparable to those of physicians’ diagnoses. In the pediatrics task, collaborative inquiry led to a significant increase in <italic>F</italic><sub>1</sub>-score (0.633, 95% CI 0.627-0.638), general accuracy (0.842, 95% CI 0.839-0.844), and accuracy (0.732, 95% CI 0.729-0.735).</p>
        <p>Considering the high prevalence of respiratory diseases in our data set, we evaluated MedRIA’s performance on a more representative data set to show its generalizability. Specifically, we randomly discarded two-thirds of respiratory cases from the emergency data set and three-quarters from the pediatrics data set. The results are presented in Table S1 in <xref ref-type="supplementary-material" rid="app5">Multimedia Appendix 5</xref>. From these results, we can draw similar conclusions to those obtained from the experiments conducted on the complete data set.</p>
      </sec>
      <sec>
        <title>Inquiry Logic Analysis</title>
        <p><xref ref-type="table" rid="table4">Table 4</xref> provides the number of different types of positive recalled features, which refer to exhibited symptoms or laboratory test results showing out-of-range values. Collecting more positive features under the same number of inquiries often leads to more accurate diagnosis results [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]. In the pediatrics task, 36% (7.326/20.429; 95% CI 7.294-7.357) of the features collected by physicians were positive, and MedRIA’s own inquiries recalled 66% (4.852/7.326; 95% CI 4.825-4.877) of positive features. Specifically, it recalled 62% (1.665/2.692; 95% CI 1.654-1.675) of SMH features, 79% (2.24/2.837; 95% CI 2.23-2.25) of PE features, and 53% (0.948/1.797; 95% CI 0.931-0.965) of AE features. When MedRIA worked with physicians, the recall rates for all types of features were &#62;95%. Overall, we observed that MedRIA was capable of accurately identifying positive features that were not mentioned in the chief concerns of patients. This ability is crucial during the investigation process because patients may not always have sufficient medical knowledge to fully describe their health conditions.</p>
        <p><xref ref-type="supplementary-material" rid="app6">Multimedia Appendix 6</xref> shows the top 10 physician inquiry features on patients diagnosed with pharyngitis in the emergency task and tonsillitis in the pediatrics task. We observed that MedRIA could accurately inquire about features obtained by physicians. <xref rid="figure5" ref-type="fig">Figures 5</xref> and <xref rid="figure6" ref-type="fig">6</xref> illustrate when these features were investigated by MedRIA and through collaborative investigation, respectively. First, we observed a clear distinction between when SMH and PE features were acquired, which is in line with our settings for MedRIA’s inquiry process. SMH features, including cough, runny nose, convulsions, and chills, were consistently acquired before the seventh step, whereas PE features, including pharyngeal congestion, enlarged tonsils, coarse breath sounds, rash, herpes, and hand and foot rash, were consistently acquired after the seventh step. We also noticed that consecutive steps of inquiries exhibited consistently high frequencies, allowing us to understand MedRIA’s inquiry logic clearly. For example, when conducting PEs, MedRIA began with pharyngeal congestion and enlarged tonsils followed by coarse breath sounds and rash. This logical sequence reflects a structured approach to differential diagnosis, ensuring a thorough evaluation of relevant symptoms and signs. Pharyngeal congestion and enlarged tonsils are pivotal features in the context of pharyngitis. Coarse breath sounds may suggest respiratory issues or lung conditions, whereas rash can be associated with a wide range of dermatological, allergic, or infectious disorders. As shown in <xref rid="figure5" ref-type="fig">Figures 5</xref> and <xref rid="figure6" ref-type="fig">6</xref>, when collaborating with physicians, the refinement of MedRIA’s inquiry logic is evident in the increased stability of determining which features to inquire about at each step. <xref ref-type="table" rid="table5">Table 5</xref> provides concrete examples of MedRIA’s inquiry sequences, where the aforementioned logic can be traced back. Figure S1 in <xref ref-type="supplementary-material" rid="app7">Multimedia Appendix 7</xref> presents the tree diagram depicting the order of MedRIA’s inquiry features for 4 patients diagnosed with pharyngitis in the emergency task. These evidences demonstrate MedRIA’s coherent, stable, and well-reasoned inquiry logic. The characteristics of inquiry features for all diseases in both tasks are shown in Figures S1-S6 in <xref ref-type="supplementary-material" rid="app8">Multimedia Appendix 8</xref>.</p>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Number of recalled features from the extracted features by MedRIA in the emergency and pediatrics tasks.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="120"/>
            <col width="120"/>
            <col width="110"/>
            <col width="120"/>
            <col width="130"/>
            <col width="120"/>
            <col width="130"/>
            <col width="120"/>
            <thead>
              <tr valign="top">
                <td colspan="2">
                  <break/>
                </td>
                <td>Average SMH<sup>a</sup> features (95% CI)</td>
                <td>Average PE<sup>b</sup> features (95% CI)</td>
                <td>Average AE<sup>c</sup> features (95% CI)</td>
                <td>Average positive features<sup>d</sup> (95% CI)</td>
                <td>Average positive SMH features (95% CI)</td>
                <td>Average positive PE features (95% CI)</td>
                <td>Average positive AE features (95% CI)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="9">
                  <bold>Emergency</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Physicians</td>
                <td>7.295 (7.26-7.332)</td>
                <td>5.291 (5.265-5.32)</td>
                <td>6.902 (6.793-7.011)</td>
                <td>6.83 (6.788-6.87)</td>
                <td>2.52 (2.503-2.538)</td>
                <td>2.527 (2.514-2.541)</td>
                <td>1.782 (1.749-1.813)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>MedRIA</td>
                <td>4.31 (4.29-4.331)</td>
                <td>3.835 (3.808-3.865)</td>
                <td>2.483 (2.421-2.546)</td>
                <td>3.923 (3.897-3.954)</td>
                <td>1.363 (1.353-1.375)</td>
                <td>1.907 (1.894-1.92)</td>
                <td>0.653 (0.635-0.672)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Collaboration</td>
                <td>7.01 (6.978-7.043)</td>
                <td>5.222 (5.196-5.25)</td>
                <td>6.311 (6.206-6.415)</td>
                <td>6.543 (6.505-6.581)</td>
                <td>2.435 (2.418-2.452)</td>
                <td>2.501 (2.489-2.515)</td>
                <td>1.607 (1.576-1.636)</td>
              </tr>
              <tr valign="top">
                <td colspan="9">
                  <bold>Pediatrics</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Physicians</td>
                <td>7.522 (7.494-7.546)</td>
                <td>6.29 (6.269-6.312)</td>
                <td>6.617 (6.546-6.687)</td>
                <td>7.326 (7.294-7.357)</td>
                <td>2.692 (2.677-2.707)</td>
                <td>2.837 (2.826-2.848)</td>
                <td>1.797 (1.776-1.82)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>MedRIA</td>
                <td>5.021 (5.001-5.04)</td>
                <td>4.639 (4.619-4.66)</td>
                <td>3.508 (3.452-3.565)</td>
                <td>4.852 (4.825-4.877)</td>
                <td>1.665 (1.654-1.675)</td>
                <td>2.24 (2.23-2.25)</td>
                <td>0.948 (0.931-0.965)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Collaboration</td>
                <td>7.461 (7.435-7.484)</td>
                <td>6.28 (6.258-6.302)</td>
                <td>6.427 (6.356-6.496)</td>
                <td>7.241 (7.209-7.27)</td>
                <td>2.672 (2.658-2.687)</td>
                <td>2.833 (2.822-2.844)</td>
                <td>1.736 (1.714-1.758)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup>SMH: symptom and medical history.</p>
            </fn>
            <fn id="table4fn2">
              <p><sup>b</sup>PE: physical examination.</p>
            </fn>
            <fn id="table4fn3">
              <p><sup>c</sup>AE: auxiliary examination.</p>
            </fn>
            <fn id="table4fn4">
              <p><sup>d</sup>Refers to exhibited symptoms or laboratory test results showing out-of-range values.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>MedRIA and collaborative inquiry heat maps of the top 10 physician inquiry features in patients diagnosed with pharyngitis in the emergency task.</p>
          </caption>
          <graphic xlink:href="jmir_v26i1e54616_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure6" position="float">
          <label>Figure 6</label>
          <caption>
            <p>MedRIA and collaborative inquiry heat maps of the top 10 physician inquiry features in patients diagnosed with tonsillitis in the pediatrics task.</p>
          </caption>
          <graphic xlink:href="jmir_v26i1e54616_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Examples of the inquiry sequences of MedRIA on 3 patients diagnosed with pharyngitis.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="70"/>
            <col width="80"/>
            <col width="120"/>
            <col width="250"/>
            <col width="300"/>
            <col width="180"/>
            <thead>
              <tr valign="top">
                <td>Gender</td>
                <td>Age (y)</td>
                <td>Chief concern</td>
                <td>Inquiry sequences of SMH<sup>a</sup></td>
                <td>Inquiry sequences of PE<sup>b</sup></td>
                <td>Inquiry sequences of AE<sup>c</sup></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Male</td>
                <td>26</td>
                <td>
                  <italic>Sore throat</italic>
                  <sup>d</sup>
                </td>
                <td><italic>Fever(0)</italic><sup>e</sup>, <italic>cough(0)</italic>, <italic>runny nose(0)</italic>, <italic>nasal congestion(0)</italic>, <italic>chest pain(0)</italic>, <italic>coughing up phlegm(0)</italic>, abdominal pain, diarrhea</td>
                <td><italic>Pharyngeal congestion(1)</italic>, <italic>enlarged tonsils(0)</italic>, <italic>moist rales(0)</italic>, <italic>dry rales(0)</italic>, lower limb edema, <italic>coarse breath sounds(0)</italic></td>
                <td>
                  <italic>Absolute monocyte count [complete blood count]</italic>
                  <sup>f</sup>
                </td>
              </tr>
              <tr valign="top">
                <td>Male</td>
                <td>50</td>
                <td>
                  <italic>Pharyngeal foreign body sensation</italic>
                </td>
                <td>Fever, <italic>cough(1)</italic>, <italic>sore throat(0)</italic>, runny nose, <italic>coughing up phlegm(0)</italic>, abdominal pain, diarrhea, vomiting, dizziness</td>
                <td><italic>Pharyngeal congestion(1)</italic>, <italic>enlarged tonsils(0)</italic>, <italic>moist rales(0)</italic>, <italic>dry rales(0)</italic>, <italic>coarse breath sounds(0)</italic>, rash</td>
                <td>Absolute monocyte count</td>
              </tr>
              <tr valign="top">
                <td>Male</td>
                <td>4</td>
                <td>
                  <italic>Fever</italic>
                </td>
                <td><italic>Cough(1)</italic>, runny nose, <italic>vomiting(0)</italic>, coughing up phlegm, <italic>diarrhea(0)</italic>, <italic>convulsions(0)</italic>, <italic>shortness of breath(0)</italic></td>
                <td><italic>Pharyngeal congestion(1)</italic>, <italic>coarse breath sounds(1)</italic>, <italic>enlarged tonsils(0)</italic>, <italic>hand and foot Rash(0)</italic>, <italic>dry rales(0)</italic>, normal muscle tone, <italic>moist rales(0)</italic></td>
                <td>
                  <italic>Absolute monocyte count [complete blood count]</italic>
                </td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table5fn1">
              <p><sup>a</sup>SMH: symptom and medical history.</p>
            </fn>
            <fn id="table5fn2">
              <p><sup>b</sup>PE: physical examination.</p>
            </fn>
            <fn id="table5fn3">
              <p><sup>c</sup>AE: auxiliary examination.</p>
            </fn>
            <fn id="table5fn4">
              <p><sup>d</sup>Features belonging to the extracted features are italicized.</p>
            </fn>
            <fn id="table5fn5">
              <p><sup>e</sup>Feature values are indicated in parentheses.</p>
            </fn>
            <fn id="table5fn6">
              <p><sup>f</sup>Contents within square brackets represent the associated laboratory tests documented in the patient’s health record.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>External Validation</title>
        <p>We used external medical dialogues to evaluate MedRIA’s inquiry logic. These dialogues consist of inquiry sequences generated by physicians during medical consultations. Limited by the online scenario, the average length of the inquiry sequences was 3.905 (95% CI 3.744-4.076), consisting of 3.043 (95% CI 2.895-3.195) inquiries about SMH and PE features and 0.862 (95% CI 0.814-0.907) recommended AEs. Diagnoses based on such few features were unreliable, so we primarily focused on evaluating MedRIA’s own inquiry order. As a result, MedRIA matched 64% (1.946/3.043; 95% CI 1.835-2.058) of the inquiries in the inquiry sequences and 28% (0.244/0.862; 95% CI 0.218-0.269) of recommended AEs. We compared the order of MedRIA’s inquiries to the inquiry sequences of physicians. The normalized Kendall τ distance was 0.323 (95% CI 0.301-0.346). It indicated that only 32.3% of pairs of inquiry features differed in ordering, demonstrating MedRIA’s consistency with physicians and reasonable inquiry logic.</p>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>In this study, we proposed a reinforcement learning medical inquiry assistant, MedRIA, aiming to provide inquiry recommendations for medical investigation processes. The variety of questions that can be asked during the medical investigation process, especially when it incorporates PEs and AEs, poses a significant challenge. In addition, patients vary in their understanding of their health status and their ability to articulate it. To address these issues, MedRIA uses an actor-critic framework [<xref ref-type="bibr" rid="ref28">28</xref>]. The actor incorporates a pretrained VAE [<xref ref-type="bibr" rid="ref31">31</xref>] to recommend actions based on conditional probability distributions between observed and unobserved patient information. MedRIA uses a supervised diagnostic prediction model to aid in action selection, ensuring that the actor suggests inquiries that contribute to accurate diagnoses. In addition, MedRIA places significant emphasis on crafting a reward function to guide the reinforcement learning process.</p>
        <p>The superiority of these designs in MedRIA was verified in our retrospective experiments. When conducting its own inquiries in both emergency and pediatrics scenarios, MedRIA demonstrated comparable diagnostic prediction performance on AUROCs with that of physicians and even achieved a higher AUROC in the pediatrics setting. This was accomplished with MedRIA obtaining only 55% (10.628/19.488) and 64% (13.168/20.429) of the information that physicians received in making the final diagnosis in the emergency and pediatrics tasks, respectively. It is important to consider that AI, similarly to MedRIA, has the capacity to identify subtle patterns within vast data sets, which physicians may overlook. This inherent capability often leads to divergence from the inquiry logic of individual clinicians, as evidenced in our experiments. Given that MedRIA has demonstrated its ability to identify important diagnostic features, such divergence should be considered acceptable as it may provide new insights. In addition, it is worth noting that our experiments were based on EHRs. Therefore, when MedRIA conducted its own inquiries, its performance might very well have been underestimated due to the unavailability of patient information that was not documented in the records.</p>
        <p>When MedRIA worked in simulated collaboration with physicians, it notably reduced the number of inquiries made by physicians to 46% (6.037/13.26; 95% CI 6.009-6.064) and 43% (6.245/14.364; 95% CI 6.225-6.269) while maintaining feature recall rates of 95% (18.543/19.488; 95% CI 18.425-18.657) and 99% (20.168/20.429; 95% CI 20.080-20.251) in the emergency and pediatrics scenarios, respectively. This reduction suggests that MedRIA’s recommendations are sufficiently informative to assist physicians in considering aspects they may have overlooked. The additional insights provided by AI recommendations have a significant impact on medical decision-making [<xref ref-type="bibr" rid="ref46">46</xref>]. By leveraging the insights provided by MedRIA, physicians can potentially make more informed decisions and arrive at more accurate diagnoses.</p>
        <p>The demonstration and analysis of MedRIA’s inquiry feature frequencies, as well as concrete inquiry sequences, reveal its clear inquiry logic for different diseases, which resembles the approach of physicians. The ability of MedRIA to emulate the diagnostic process of human physicians suggests that it has the potential to be a useful tool in medical education, particularly in regions or populations with limited medical resources. Junior health care practitioners can leverage MedRIA to enhance their diagnostic skills, benefiting from its structured and logical inquiry process.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>Despite these promising results, it is essential to acknowledge certain limitations. First, the feature extraction process of EHRs requires careful feature engineering, which could be further refined. Second, while MedRIA excelled in adapting its inquiry logic, it is not immune to instances of missed inquiries. For example, the reliance on AEs of MedRIA is significantly lower than that of physicians. One potential solution is to enhance MedRIA by modeling the significance of inquiries for disease treatment. This is because the purpose of examinations may not be for diagnosis but to determine the severity of the disease to formulate appropriate treatment.</p>
        <p>Third, the composition of patient presentations can vary significantly between countries. For example, in some Western countries, only 5% to 20% of emergency [<xref ref-type="bibr" rid="ref47">47</xref>] or pediatrics [<xref ref-type="bibr" rid="ref48">48</xref>] outpatients are due to upper respiratory tract infections. The proportion in our data set was many times greater due to seasonal variations. We speculate that this may have arisen due to limited access to primary care, seasonal respiratory peaks during the autumn and winter months, greater COVID-19 awareness and fear, and our method of prioritizing the most frequent diagnoses. Changes in these factors, such as using summer data in China or winter data elsewhere, may influence accuracy. Furthermore, while MedRIA’s workflow is language independent, the evaluation of our system has been limited to a Chinese context. Further validation in other languages and health care settings is necessary to establish its broader applicability and effectiveness.</p>
        <p>Fourth, our AI system would be biased toward excess certainty if deployed in the real world as it lacks the humility to recognize its diagnostic limitations. Future work should include the AI system’s degree of confidence and manage corresponding clinical risks. Fifth, decision system developers must consider adopting safe integration systems to mitigate potential errors, especially for life-threatening conditions such as appendicitis, where risk aversion may be greater. Sixth, future work could incorporate MedRIA with the latest developments in LLMs [<xref ref-type="bibr" rid="ref49">49</xref>], which will assist in its future deployment and testing in clinical workflows.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>In conclusion, MedRIA is a significant step toward enhancing health care decision-making processes. Its proficiency in medical inquiries, ability to identify important diagnostic features, and adaptability underscore its value as an AI-driven diagnostic assistant. While there are challenges to overcome, the results of this study show a prototype for sophisticated and effective AI applied in health care, ultimately benefiting both health care professionals and patients.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>The feature set of the emergency task.</p>
        <media xlink:href="jmir_v26i1e54616_app1.xlsx" xlink:title="XLSX File  (Microsoft Excel File), 26 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>The feature set of the pediatrics task.</p>
        <media xlink:href="jmir_v26i1e54616_app2.xlsx" xlink:title="XLSX File  (Microsoft Excel File), 28 KB"/>
      </supplementary-material>
      <supplementary-material id="app3">
        <label>Multimedia Appendix 3</label>
        <p>Implementation details of MedRIA.</p>
        <media xlink:href="jmir_v26i1e54616_app3.docx" xlink:title="DOCX File , 22 KB"/>
      </supplementary-material>
      <supplementary-material id="app4">
        <label>Multimedia Appendix 4</label>
        <p>Receiver operating characteristic curves of all diseases in the emergency and pediatrics tasks.</p>
        <media xlink:href="jmir_v26i1e54616_app4.docx" xlink:title="DOCX File , 2682 KB"/>
      </supplementary-material>
      <supplementary-material id="app5">
        <label>Multimedia Appendix 5</label>
        <p>Performance of MedRIA in more generalizable emergency and pediatrics tasks.</p>
        <media xlink:href="jmir_v26i1e54616_app5.docx" xlink:title="DOCX File , 21 KB"/>
      </supplementary-material>
      <supplementary-material id="app6">
        <label>Multimedia Appendix 6</label>
        <p>Inquiry frequencies of the top 10 physician inquiry features in patients diagnosed with pharyngitis in the emergency task and tonsillitis in the pediatrics task.</p>
        <media xlink:href="jmir_v26i1e54616_app6.png" xlink:title="PNG File , 92 KB"/>
      </supplementary-material>
      <supplementary-material id="app7">
        <label>Multimedia Appendix 7</label>
        <p>Tree diagram of the inquiry features of MedRIA for 4 patients diagnosed with pharyngitis in the emergency task. These 4 patients shared similar characteristics, all being male with ages ranging from 31 to 32 years and complaining of sore throat. The numbers in brackets indicate the timesteps of inquiries.</p>
        <media xlink:href="jmir_v26i1e54616_app7.docx" xlink:title="DOCX File , 215 KB"/>
      </supplementary-material>
      <supplementary-material id="app8">
        <label>Multimedia Appendix 8</label>
        <p>Inquiry frequencies of the physician and MedRIA and inquiry heat maps of MedRIA and the collaborative inquiry in the emergency and pediatrics tasks.</p>
        <media xlink:href="jmir_v26i1e54616_app8.docx" xlink:title="DOCX File , 8348 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AE</term>
          <def>
            <p>auxiliary examination</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">AI</term>
          <def>
            <p>artificial intelligence</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">AUROC</term>
          <def>
            <p>area under the receiver operating characteristic curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">CDSS</term>
          <def>
            <p>clinical decision support system</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">EHR</term>
          <def>
            <p>electronic health record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">LLM</term>
          <def>
            <p>large language model</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">MedBERT</term>
          <def>
            <p>Medical Bidirectional Encoder Representations From Transformers</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">MLP</term>
          <def>
            <p>multilayer perceptron</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">PE</term>
          <def>
            <p>physical examination</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">SMH</term>
          <def>
            <p>symptom and medical history</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">VAE</term>
          <def>
            <p>variational autoencoder</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This work is supported by the National Key R&#38;D Program of China (2021YFF1201303 and 2022YFC2703105), Guoqiang Institute of Tsinghua University, and Beijing National Research Center for Information Science and Technology. The funders had no role in the study design, data collection and analysis, the decision to publish, or the preparation of the manuscript.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Musen</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Middleton</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Greenes</surname>
              <given-names>RA</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Shortliffe</surname>
              <given-names>EH</given-names>
            </name>
            <name name-style="western">
              <surname>Cimino</surname>
              <given-names>JJ</given-names>
            </name>
          </person-group>
          <article-title>Clinical decision-support systems</article-title>
          <source>Biomedical Informatics: Computer Applications in Health Care and Biomedicine</source>
          <year>2021</year>
          <publisher-loc>Cham, Switzerland</publisher-loc>
          <publisher-name>Springer</publisher-name>
          <fpage>795</fpage>
          <lpage>840</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sutton</surname>
              <given-names>RT</given-names>
            </name>
            <name name-style="western">
              <surname>Pincock</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Baumgart</surname>
              <given-names>DC</given-names>
            </name>
            <name name-style="western">
              <surname>Sadowski</surname>
              <given-names>DC</given-names>
            </name>
            <name name-style="western">
              <surname>Fedorak</surname>
              <given-names>RN</given-names>
            </name>
            <name name-style="western">
              <surname>Kroeker</surname>
              <given-names>KI</given-names>
            </name>
          </person-group>
          <article-title>An overview of clinical decision support systems: benefits, risks, and strategies for success</article-title>
          <source>NPJ Digit Med</source>
          <year>2020</year>
          <volume>3</volume>
          <fpage>17</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32047862"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41746-020-0221-y</pub-id>
          <pub-id pub-id-type="medline">32047862</pub-id>
          <pub-id pub-id-type="pii">221</pub-id>
          <pub-id pub-id-type="pmcid">PMC7005290</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Berner</surname>
              <given-names>ES</given-names>
            </name>
            <name name-style="western">
              <surname>Graber</surname>
              <given-names>ML</given-names>
            </name>
          </person-group>
          <article-title>Overconfidence as a cause of diagnostic error in medicine</article-title>
          <source>Am J Med</source>
          <year>2008</year>
          <month>05</month>
          <volume>121</volume>
          <issue>5 Suppl</issue>
          <fpage>S2</fpage>
          <lpage>23</lpage>
          <pub-id pub-id-type="doi">10.1016/j.amjmed.2008.01.001</pub-id>
          <pub-id pub-id-type="medline">18440350</pub-id>
          <pub-id pub-id-type="pii">S0002-9343(08)00040-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bornstein</surname>
              <given-names>BH</given-names>
            </name>
            <name name-style="western">
              <surname>Emler</surname>
              <given-names>AC</given-names>
            </name>
          </person-group>
          <article-title>Rationality in medical decision making: a review of the literature on doctors' decision-making biases</article-title>
          <source>J Eval Clin Pract</source>
          <year>2001</year>
          <month>05</month>
          <volume>7</volume>
          <issue>2</issue>
          <fpage>97</fpage>
          <lpage>107</lpage>
          <pub-id pub-id-type="doi">10.1046/j.1365-2753.2001.00284.x</pub-id>
          <pub-id pub-id-type="medline">11489035</pub-id>
          <pub-id pub-id-type="pii">jep284</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shickel</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Tighe</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Bihorac</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rashidi</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Deep EHR: a survey of recent advances in deep learning techniques for electronic health record (EHR) analysis</article-title>
          <source>IEEE J Biomed Health Inform</source>
          <year>2018</year>
          <month>09</month>
          <volume>22</volume>
          <issue>5</issue>
          <fpage>1589</fpage>
          <lpage>604</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/29989977"/>
          </comment>
          <pub-id pub-id-type="doi">10.1109/JBHI.2017.2767063</pub-id>
          <pub-id pub-id-type="medline">29989977</pub-id>
          <pub-id pub-id-type="pmcid">PMC6043423</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rajpurkar</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Banerjee</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Topol</surname>
              <given-names>EJ</given-names>
            </name>
          </person-group>
          <article-title>AI in health and medicine</article-title>
          <source>Nat Med</source>
          <year>2022</year>
          <month>01</month>
          <day>20</day>
          <volume>28</volume>
          <issue>1</issue>
          <fpage>31</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1038/s41591-021-01614-0</pub-id>
          <pub-id pub-id-type="medline">35058619</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41591-021-01614-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Tsui</surname>
              <given-names>BY</given-names>
            </name>
            <name name-style="western">
              <surname>Ni</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Valentim</surname>
              <given-names>CC</given-names>
            </name>
            <name name-style="western">
              <surname>Baxter</surname>
              <given-names>SL</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Kermany</surname>
              <given-names>DS</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tian</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Shao</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Hou</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Hewett</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Zang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Pan</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Ling</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Cui</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ye</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ou</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Deng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Hou</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Yao</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Duan</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Gibson</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>CL</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>ED</given-names>
            </name>
            <name name-style="western">
              <surname>Karin</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Wen</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Pizzato</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Bao</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Xiang</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Haw</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Goldbaum</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tremoulet</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hsu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Carter</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Xia</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Evaluation and accurate diagnoses of pediatric diseases using artificial intelligence</article-title>
          <source>Nat Med</source>
          <year>2019</year>
          <month>03</month>
          <volume>25</volume>
          <issue>3</issue>
          <fpage>433</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1038/s41591-018-0335-9</pub-id>
          <pub-id pub-id-type="medline">30742121</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41591-018-0335-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>HY</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Pan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Shao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>A transformer-based representation-learning model with unified processing of multimodal input for clinical diagnostics</article-title>
          <source>Nat Biomed Eng</source>
          <year>2023</year>
          <month>06</month>
          <day>12</day>
          <volume>7</volume>
          <issue>6</issue>
          <fpage>743</fpage>
          <lpage>55</lpage>
          <pub-id pub-id-type="doi">10.1038/s41551-023-01045-x</pub-id>
          <pub-id pub-id-type="medline">37308585</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41551-023-01045-x</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Pareek</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Seyyedi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Banerjee</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Lungren</surname>
              <given-names>MP</given-names>
            </name>
          </person-group>
          <article-title>Fusion of medical imaging and electronic health records using deep learning: a systematic review and implementation guidelines</article-title>
          <source>NPJ Digit Med</source>
          <year>2020</year>
          <month>10</month>
          <day>16</day>
          <volume>3</volume>
          <issue>1</issue>
          <fpage>136</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41746-020-00341-z"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41746-020-00341-z</pub-id>
          <pub-id pub-id-type="medline">33083571</pub-id>
          <pub-id pub-id-type="pii">341</pub-id>
          <pub-id pub-id-type="pmcid">PMC7567861</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rajkomar</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Oren</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Dai</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Hajaj</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Hardt</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Marcus</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sundberg</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Yee</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Flores</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Duggan</surname>
              <given-names>GE</given-names>
            </name>
            <name name-style="western">
              <surname>Irvine</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Le</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Litsch</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Mossin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Tansuwan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Wexler</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wilson</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ludwig</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Volchenboum</surname>
              <given-names>SL</given-names>
            </name>
            <name name-style="western">
              <surname>Chou</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Pearson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Madabushi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>NH</given-names>
            </name>
            <name name-style="western">
              <surname>Butte</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Howell</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Cui</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Corrado</surname>
              <given-names>GS</given-names>
            </name>
            <name name-style="western">
              <surname>Dean</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Scalable and accurate deep learning with electronic health records</article-title>
          <source>NPJ Digit Med</source>
          <year>2018</year>
          <month>5</month>
          <day>8</day>
          <volume>1</volume>
          <issue>1</issue>
          <fpage>18</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41746-018-0029-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41746-018-0029-1</pub-id>
          <pub-id pub-id-type="medline">31304302</pub-id>
          <pub-id pub-id-type="pii">29</pub-id>
          <pub-id pub-id-type="pmcid">PMC6550175</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Suk</surname>
              <given-names>HI</given-names>
            </name>
          </person-group>
          <article-title>Deep learning in medical image analysis</article-title>
          <source>Annu Rev Biomed Eng</source>
          <year>2017</year>
          <month>06</month>
          <day>21</day>
          <volume>19</volume>
          <fpage>221</fpage>
          <lpage>48</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/28301734"/>
          </comment>
          <pub-id pub-id-type="doi">10.1146/annurev-bioeng-071516-044442</pub-id>
          <pub-id pub-id-type="medline">28301734</pub-id>
          <pub-id pub-id-type="pmcid">PMC5479722</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hosny</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Parmar</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Quackenbush</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Schwartz</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Aerts</surname>
              <given-names>HJ</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence in radiology</article-title>
          <source>Nat Rev Cancer</source>
          <year>2018</year>
          <month>12</month>
          <volume>18</volume>
          <issue>8</issue>
          <fpage>500</fpage>
          <lpage>10</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29777175"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41568-018-0016-5</pub-id>
          <pub-id pub-id-type="medline">29777175</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41568-018-0016-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC6268174</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Litjens</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Kooi</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Bejnordi</surname>
              <given-names>BE</given-names>
            </name>
            <name name-style="western">
              <surname>Setio</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Ciompi</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Ghafoorian</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>van der Laak</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>van Ginneken</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Sánchez</surname>
              <given-names>CI</given-names>
            </name>
          </person-group>
          <article-title>A survey on deep learning in medical image analysis</article-title>
          <source>Medical Image Analysis</source>
          <year>2017</year>
          <month>12</month>
          <volume>42</volume>
          <fpage>60</fpage>
          <lpage>88</lpage>
          <pub-id pub-id-type="doi">10.1016/J.MEDIA.2017.07.005</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>He</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Mao</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Hernàndez-Lobato</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>BSODA: a bipartite scalable framework for online disease diagnosis</article-title>
          <source>Proceedings of the 2022 ACM Web Conference</source>
          <year>2022</year>
          <conf-name>WWW '22</conf-name>
          <conf-date>April 25-29, 2022</conf-date>
          <conf-loc>Virtual Event</conf-loc>
          <fpage>2511</fpage>
          <lpage>21</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/10.1145/3485447.3512123"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/3485447.3512123</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Diaformer: automatic diagnosis via symptoms sequence generation</article-title>
          <source>Proceedings of the 36th AAAI Conference on Artificial Intelligence</source>
          <year>2022</year>
          <conf-name>AAAI '22</conf-name>
          <conf-date>February 22–March 1, 2022</conf-date>
          <conf-loc>Virtual Event</conf-loc>
          <fpage>4432</fpage>
          <lpage>40</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cdn.aaai.org/ojs/20365/20365-13-24378-1-2-20220628.pdf"/>
          </comment>
          <pub-id pub-id-type="doi">10.1609/aaai.v36i4.20365</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Dialogue based disease screening through domain customized reinforcement learning</article-title>
          <source>Proceedings of the 27th ACM SIGKDD Conference on Knowledge Discovery &#38; Data Mining</source>
          <year>2021</year>
          <conf-name>KDD '21</conf-name>
          <conf-date>August 14-18, 2021</conf-date>
          <conf-loc>Virtual Event</conf-loc>
          <fpage>1120</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/10.1145/3447548.3467255"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/3447548.3467255</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xia</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Shi</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Generative adversarial regularized mutual information policy gradient framework for automatic diagnosis</article-title>
          <source>Proc AAAI Conf Artif Intell</source>
          <year>2020</year>
          <month>04</month>
          <day>03</day>
          <volume>34</volume>
          <issue>01</issue>
          <fpage>1062</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1609/aaai.v34i01.5456</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhong</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Liao</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Hierarchical reinforcement learning for automatic disease diagnosis</article-title>
          <source>Bioinformatics</source>
          <year>2022</year>
          <month>08</month>
          <day>10</day>
          <volume>38</volume>
          <issue>16</issue>
          <fpage>3995</fpage>
          <lpage>4001</lpage>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/btac408</pub-id>
          <pub-id pub-id-type="medline">35775965</pub-id>
          <pub-id pub-id-type="pii">6625731</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>“My nose is running.” “Are you also coughing?”: building a medical diagnosis agent with interpretable inquiry logics</article-title>
          <source>Proceedings of the 31st International Joint Conference on Artificial Intelligence</source>
          <year>2022</year>
          <conf-name>IJCAI '22</conf-name>
          <conf-date>July 23-29, 2022</conf-date>
          <conf-loc>Vienna, Austria</conf-loc>
          <fpage>4266</fpage>
          <lpage>72</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ijcai.org/proceedings/2022/0592.pdf"/>
          </comment>
          <pub-id pub-id-type="doi">10.24963/ijcai.2022/592</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Wen</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Cao</surname>
              <given-names>SL</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Qian</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Online disease diagnosis with inductive heterogeneous graph convolutional networks</article-title>
          <source>Proceedings of the 2021 Web Conference</source>
          <year>2021</year>
          <conf-name>WWW '21</conf-name>
          <conf-date>April 19-23, 2021</conf-date>
          <conf-loc>Ljubljana, Slovenia</conf-loc>
          <fpage>3349</fpage>
          <lpage>58</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/10.1145/3442381.3449795"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/3442381.3449795</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Towards causality-aware inferring: a sequential discriminative approach for medical diagnosis</article-title>
          <source>IEEE Trans Pattern Anal Mach Intell</source>
          <year>2021</year>
          <fpage>1</fpage>
          <lpage>12</lpage>
          <pub-id pub-id-type="doi">10.1109/tpami.2023.3292363</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ouyang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Almeida</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Wainwright</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Mishkin</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Agarwal</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Slama</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Ray</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Schulman</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hilton</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kelton</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Training language models to follow instructions with human feedback</article-title>
          <source>arXiv. Preprint posted online March 4, 2022</source>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2203.02155"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kung</surname>
              <given-names>TH</given-names>
            </name>
            <name name-style="western">
              <surname>Cheatham</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Medenilla</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sillos</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>De Leon</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Elepaño</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Madriaga</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Aggabao</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Diaz-Candido</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Maningo</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tseng</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Performance of ChatGPT on USMLE: potential for AI-assisted medical education using large language models</article-title>
          <source>PLOS Digit Health</source>
          <year>2023</year>
          <month>02</month>
          <day>9</day>
          <volume>2</volume>
          <issue>2</issue>
          <fpage>e0000198</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/36812645"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pdig.0000198</pub-id>
          <pub-id pub-id-type="medline">36812645</pub-id>
          <pub-id pub-id-type="pii">PDIG-D-22-00371</pub-id>
          <pub-id pub-id-type="pmcid">PMC9931230</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Meskó</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Topol</surname>
              <given-names>EJ</given-names>
            </name>
          </person-group>
          <article-title>The imperative for regulatory oversight of large language models (or generative AI) in healthcare</article-title>
          <source>NPJ Digit Med</source>
          <year>2023</year>
          <month>07</month>
          <day>06</day>
          <volume>6</volume>
          <issue>1</issue>
          <fpage>120</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41746-023-00873-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41746-023-00873-0</pub-id>
          <pub-id pub-id-type="medline">37414860</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41746-023-00873-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC10326069</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Thirunavukarasu</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Ting</surname>
              <given-names>DS</given-names>
            </name>
            <name name-style="western">
              <surname>Elangovan</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Gutierrez</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Tan</surname>
              <given-names>TF</given-names>
            </name>
            <name name-style="western">
              <surname>Ting</surname>
              <given-names>DS</given-names>
            </name>
          </person-group>
          <article-title>Large language models in medicine</article-title>
          <source>Nat Med</source>
          <year>2023</year>
          <month>08</month>
          <day>17</day>
          <volume>29</volume>
          <issue>8</issue>
          <fpage>1930</fpage>
          <lpage>40</lpage>
          <pub-id pub-id-type="doi">10.1038/s41591-023-02448-8</pub-id>
          <pub-id pub-id-type="medline">37460753</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41591-023-02448-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wornow</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Thapa</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Steinberg</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Fleming</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Pfeffer</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Fries</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>NH</given-names>
            </name>
          </person-group>
          <article-title>The shaky foundations of large language models and foundation models for electronic health records</article-title>
          <source>NPJ Digit Med</source>
          <year>2023</year>
          <month>07</month>
          <day>29</day>
          <volume>6</volume>
          <issue>1</issue>
          <fpage>135</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41746-023-00879-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41746-023-00879-8</pub-id>
          <pub-id pub-id-type="medline">37516790</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41746-023-00879-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC10387101</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Taylor</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>ChatGPT’s alter ego, Dan: users jailbreak AI program to get around ethical safeguards</article-title>
          <source>The Guardian</source>
          <access-date>2024-04-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.theguardian.com/technology/2023/mar/08/chatgpt-alter-ego-dan-users-jailbreak-ai-program-to-get-around-ethical-safeguards">https://www.theguardian.com/technology/2023/mar/08/chatgpt-alter-ego-dan-users-jailbreak-ai-program-to-get-around-​ethical-safeguards</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mnih</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Badia</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mirza</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Graves</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lillicrap</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Harley</surname>
              <given-names>TP</given-names>
            </name>
            <name name-style="western">
              <surname>Silver</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kavukcuoglu</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Asynchronous methods for deep reinforcement learning</article-title>
          <source>Proceedings of the 33rd International Conference on International Conference on Machine Learning</source>
          <year>2016</year>
          <conf-name>ICML'16</conf-name>
          <conf-date>June 19-24, 2016</conf-date>
          <conf-loc>New York, NY</conf-loc>
          <fpage>1928</fpage>
          <lpage>37</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/10.5555/3045390.3045594"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Balogh</surname>
              <given-names>EP</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>BT</given-names>
            </name>
            <name name-style="western">
              <surname>Ball</surname>
              <given-names>JR</given-names>
            </name>
          </person-group>
          <source>Improving Diagnosis in Health Care</source>
          <year>2015</year>
          <publisher-loc>New York, NY</publisher-loc>
          <publisher-name>The National Academies Press</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kenton</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Toutanova</surname>
              <given-names>LK</given-names>
            </name>
          </person-group>
          <article-title>BERT: pre-training of deep bidirectional transformers for language understanding</article-title>
          <source>Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies</source>
          <year>2019</year>
          <conf-name>NAACL-HLT '19</conf-name>
          <conf-date>June 2-7, 2019</conf-date>
          <conf-loc>Minneapolis, MN</conf-loc>
          <fpage>4171</fpage>
          <lpage>86</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://aclanthology.org/N19-1423.pdf"/>
          </comment>
          <pub-id pub-id-type="doi">10.18653/v1/N19-1423</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kingma</surname>
              <given-names>DP</given-names>
            </name>
            <name name-style="western">
              <surname>Welling</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Auto-encoding variational bayes</article-title>
          <source>arXiv. Preprint posted online December 20, 2013</source>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1312.6114"/>
          </comment>
          <pub-id pub-id-type="doi">10.61603/ceas.v2i1.33</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schulman</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wolski</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Dhariwal</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Radford</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Klimov</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <article-title>Proximal policy optimization algorithms</article-title>
          <source>arXiv. Preprint posted online July 20, 2017</source>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1707.06347"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Konda</surname>
              <given-names>VR</given-names>
            </name>
            <name name-style="western">
              <surname>Tsitsiklis</surname>
              <given-names>JN</given-names>
            </name>
          </person-group>
          <article-title>OnActor-critic algorithms</article-title>
          <source>SIAM J Control Optim</source>
          <year>2003</year>
          <month>01</month>
          <volume>42</volume>
          <issue>4</issue>
          <fpage>1143</fpage>
          <lpage>66</lpage>
          <pub-id pub-id-type="doi">10.1137/S0363012901385691</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schulman</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Moritz</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Levine</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Jordan</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Abbeel</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>High-dimensional continuous control using generalized advantage estimation</article-title>
          <source>arXiv. Preprint posted online June 8, 2015</source>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1506.02438"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.1506.02438</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kingma</surname>
              <given-names>DP</given-names>
            </name>
            <name name-style="western">
              <surname>Ba</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Adam: a method for stochastic optimization</article-title>
          <source>arXiv. Preprint posted online December 22, 2014</source>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1412.6980"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Paszke</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gross</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Massa</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Lerer</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bradbury</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chanan</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Killeen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Gimelshein</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Antiga</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Desmaison</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Köpf</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>PyTorch: an imperative style, high-performance deep learning library</article-title>
          <source>arXiv. Preprint posted online December 3, 2019</source>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1912.01703"/>
          </comment>
          <pub-id pub-id-type="doi">10.7551/mitpress/11474.003.0014</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Yan</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>You</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Duburcq</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Tianshou: a highly modularized deep reinforcement learning library</article-title>
          <source>J Mach Learn Res</source>
          <year>2022</year>
          <volume>23</volume>
          <issue>267</issue>
          <fpage>1</fpage>
          <lpage>6</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://jmlr.org/papers/volume23/21-1127/21-1127.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bellman</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>A markovian decision process</article-title>
          <source>Indiana Univ Math J</source>
          <year>1957</year>
          <volume>6</volume>
          <issue>4</issue>
          <fpage>679</fpage>
          <lpage>84</lpage>
          <pub-id pub-id-type="doi">10.1512/iumj.1957.6.56038</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>He</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Scalable online disease diagnosis via multi-model-fused actor-critic reinforcement learning</article-title>
          <source>Proceedings of the 28th ACM SIGKDD Conference on Knowledge Discovery and Data Mining</source>
          <year>2022</year>
          <conf-name>KDD '22</conf-name>
          <conf-date>August 14-18, 2022</conf-date>
          <conf-loc>Washington, DC</conf-loc>
          <fpage>4695</fpage>
          <lpage>703</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/10.1145/3534678.3542672"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/3534678.3542672</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Goodman</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Multimodal generative models for scalable weakly-supervised learning</article-title>
          <source>arXiv. Preprint posted online February 14, 2018</source>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1802.05335#:~:text=Multimodal%20Generative%20Models%20for%20Scalable%20Weakly%2DSupervised%20Learning,-Mike%20Wu%2C%20Noah&#38;text=Multiple%20modalities%20often%20co%2Doccur,deeper%20and%20more%20useful%20representations"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Fang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Yao</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Zhong</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>QI</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>A benchmark for automatic medical consultation system: frameworks, tasks and datasets</article-title>
          <source>Bioinformatics</source>
          <year>2023</year>
          <month>01</month>
          <day>01</day>
          <volume>39</volume>
          <issue>1</issue>
          <fpage>btac817</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/36539203"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/btac817</pub-id>
          <pub-id pub-id-type="medline">36539203</pub-id>
          <pub-id pub-id-type="pii">6947983</pub-id>
          <pub-id pub-id-type="pmcid">PMC9848052</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ke</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Meng</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Finley</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>LightGBM: a highly efficient gradient boosting decision tree</article-title>
          <source>Proceedings of the 31st International Conference on Neural Information Processing Systems</source>
          <year>2017</year>
          <conf-name>NIPS '17</conf-name>
          <conf-date>December 4-9, 2017</conf-date>
          <conf-loc>Long Beach, CA</conf-loc>
          <fpage>3149</fpage>
          <lpage>57</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/10.5555/3294996.3295074"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schmidt</surname>
              <given-names>HG</given-names>
            </name>
            <name name-style="western">
              <surname>Van Gog</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Schuit</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Van den Berge</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Van Daele</surname>
              <given-names>PL</given-names>
            </name>
            <name name-style="western">
              <surname>Bueving</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Van der Zee</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Van den Broek</surname>
              <given-names>WW</given-names>
            </name>
            <name name-style="western">
              <surname>Van Saase</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Mamede</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Do patients' disruptive behaviours influence the accuracy of a doctor's diagnosis? A randomised experiment</article-title>
          <source>BMJ Qual Saf</source>
          <year>2017</year>
          <month>01</month>
          <day>07</day>
          <volume>26</volume>
          <issue>1</issue>
          <fpage>19</fpage>
          <lpage>23</lpage>
          <pub-id pub-id-type="doi">10.1136/bmjqs-2015-004109</pub-id>
          <pub-id pub-id-type="medline">26951795</pub-id>
          <pub-id pub-id-type="pii">bmjqs-2015-004109</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mamede</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>van Gog</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>van den Berge</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Rikers</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>van Saase</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>van Guldener</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Schmidt</surname>
              <given-names>HG</given-names>
            </name>
          </person-group>
          <article-title>Effect of availability bias and reflective reasoning on diagnostic accuracy among internal medicine residents</article-title>
          <source>JAMA</source>
          <year>2010</year>
          <month>09</month>
          <day>15</day>
          <volume>304</volume>
          <issue>11</issue>
          <fpage>1198</fpage>
          <lpage>203</lpage>
          <pub-id pub-id-type="doi">10.1001/jama.2010.1276</pub-id>
          <pub-id pub-id-type="medline">20841533</pub-id>
          <pub-id pub-id-type="pii">304/11/1198</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>REFUEL: exploring sparse features in deep reinforcement learning for fast disease diagnosis</article-title>
          <source>Proceedings of the 32nd International Conference on Neural Information Processing Systems</source>
          <year>2018</year>
          <conf-name>NIPS'18</conf-name>
          <conf-date>December 3-8, 2018</conf-date>
          <conf-loc>Montréal, QC</conf-loc>
          <fpage>7333</fpage>
          <lpage>42</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/10.5555/3327757.3327834"/>
          </comment>
          <pub-id pub-id-type="doi">10.7551/mitpress/11474.003.0014</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nagendran</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Festor</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Komorowski</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gordon</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Faisal</surname>
              <given-names>AA</given-names>
            </name>
          </person-group>
          <article-title>Quantifying the impact of AI recommendations with explanations on prescription decision making</article-title>
          <source>NPJ Digit Med</source>
          <year>2023</year>
          <month>11</month>
          <day>07</day>
          <volume>6</volume>
          <issue>1</issue>
          <fpage>206</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41746-023-00955-z"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41746-023-00955-z</pub-id>
          <pub-id pub-id-type="medline">37935953</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41746-023-00955-z</pub-id>
          <pub-id pub-id-type="pmcid">PMC10630476</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nørgaard</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Mogensen</surname>
              <given-names>CB</given-names>
            </name>
            <name name-style="western">
              <surname>Teglbjærg</surname>
              <given-names>LS</given-names>
            </name>
            <name name-style="western">
              <surname>Brabrand</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lassen</surname>
              <given-names>AT</given-names>
            </name>
          </person-group>
          <article-title>Diagnostic packages can be assigned accurately in emergency departments. A multi-centre cohort study</article-title>
          <source>Dan Med J</source>
          <year>2016</year>
          <month>06</month>
          <volume>63</volume>
          <issue>6</issue>
          <fpage>A5240</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ugeskriftet.dk/dmj/A5240"/>
          </comment>
          <pub-id pub-id-type="medline">27264941</pub-id>
          <pub-id pub-id-type="pii">A5240</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hiscock</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Efron</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Sewell</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Bryson</surname>
              <given-names>HE</given-names>
            </name>
            <name name-style="western">
              <surname>Price</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Oberklaid</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>South</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wake</surname>
              <given-names>MA</given-names>
            </name>
          </person-group>
          <article-title>Children attending paediatricians study: a national prospective audit of outpatient practice from the Australian paediatric research network</article-title>
          <source>Med J Aust</source>
          <year>2011</year>
          <month>04</month>
          <day>18</day>
          <volume>194</volume>
          <issue>8</issue>
          <fpage>392</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.5694/j.1326-5377.2011.tb03028.x</pub-id>
          <pub-id pub-id-type="medline">21495938</pub-id>
          <pub-id pub-id-type="pii">his10241_fm</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Moor</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Banerjee</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Abad</surname>
              <given-names>ZS</given-names>
            </name>
            <name name-style="western">
              <surname>Krumholz</surname>
              <given-names>HM</given-names>
            </name>
            <name name-style="western">
              <surname>Leskovec</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Topol</surname>
              <given-names>EJ</given-names>
            </name>
            <name name-style="western">
              <surname>Rajpurkar</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Foundation models for generalist medical artificial intelligence</article-title>
          <source>Nature</source>
          <year>2023</year>
          <month>04</month>
          <day>12</day>
          <volume>616</volume>
          <issue>7956</issue>
          <fpage>259</fpage>
          <lpage>65</lpage>
          <pub-id pub-id-type="doi">10.1038/s41586-023-05881-4</pub-id>
          <pub-id pub-id-type="medline">37045921</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41586-023-05881-4</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
