<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
    <article-id pub-id-type="publisher-id">v19i6e220</article-id>
    <article-id pub-id-type="pmid">28634156</article-id>
    <article-id pub-id-type="doi">10.2196/jmir.7156</article-id>
    <article-categories>
      <subj-group subj-group-type="heading">
        <subject>Original Paper</subject>
      </subj-group>
      <subj-group subj-group-type="article-type">
        <subject>Original Paper</subject>
      </subj-group>
    </article-categories>
    <title-group>
      <article-title>Classifying Chinese Questions Related to Health Care Posted by Consumers Via the Internet</article-title>
    </title-group>
    <contrib-group>
      <contrib contrib-type="editor">
        <name>
          <surname>Eysenbach</surname>
          <given-names>Gunther</given-names>
        </name>
      </contrib>
    </contrib-group>
    <contrib-group>
      <contrib contrib-type="reviewer">
        <name>
          <surname>Zheng</surname>
          <given-names>Shuai</given-names>
        </name>
      </contrib>
      <contrib contrib-type="reviewer">
        <name>
          <surname>Peng</surname>
          <given-names>Yifan</given-names>
        </name>
      </contrib>
    </contrib-group>
    <contrib-group>
      <contrib contrib-type="author" id="contrib1">
        <name name-style="western">
          <surname>Guo</surname>
          <given-names>Haihong</given-names>
        </name>
        <degrees>MSc</degrees>
        <xref rid="aff1" ref-type="aff">1</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-1218-7998</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib2">
        <name name-style="western">
          <surname>Na</surname>
          <given-names>Xu</given-names>
        </name>
        <degrees>MSc</degrees>
        <xref rid="aff1" ref-type="aff">1</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-4038-1410</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib3">
        <name name-style="western">
          <surname>Hou</surname>
          <given-names>Li</given-names>
        </name>
        <degrees>PhD</degrees>
        <xref rid="aff1" ref-type="aff">1</xref>
        <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-4182-8691</ext-link>
      </contrib>
      <contrib contrib-type="author" id="contrib4" corresp="yes">
      <name name-style="western">
        <surname>Li</surname>
        <given-names>Jiao</given-names>
      </name>
      <degrees>PhD</degrees>
      <xref rid="aff1" ref-type="aff">1</xref>
      <address>
        <institution>Institute of Medical Information &#38; Library, Chinese Academy of Medical Sciences</institution>
        <addr-line>3rd Yabao Road Chaoyang District</addr-line>
        <addr-line>Beijing, 100020</addr-line>
        <country>China</country>
        <phone>86 01052328740</phone>
        <fax>86 01052328610</fax>
        <email>li.jiao@imicams.ac.cn</email>
      </address>  
      <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-6391-8343</ext-link></contrib>
    </contrib-group>
    <aff id="aff1">
      <sup>1</sup>
      <institution>Institute of Medical Information &#38; Library, Chinese Academy of Medical Sciences</institution>
      <addr-line>Beijing</addr-line>
      <country>China</country>
    </aff>
    <author-notes>
      <corresp>Corresponding Author: Jiao Li 
      <email>li.jiao@imicams.ac.cn</email></corresp>
    </author-notes>
    <pub-date pub-type="collection"><month>06</month><year>2017</year></pub-date>
    <pub-date pub-type="epub">
      <day>20</day>
      <month>06</month>
      <year>2017</year>
    </pub-date>
    <volume>19</volume>
    <issue>6</issue>
    <elocation-id>e220</elocation-id>
    <!--history from ojs - api-xml-->
    <history>
      <date date-type="received">
        <day>14</day>
        <month>12</month>
        <year>2016</year>
      </date>
      <date date-type="rev-request">
        <day>23</day>
        <month>2</month>
        <year>2017</year>
      </date>
      <date date-type="rev-recd">
        <day>20</day>
        <month>4</month>
        <year>2017</year>
      </date>
      <date date-type="accepted">
        <day>20</day>
        <month>4</month>
        <year>2017</year>
      </date>
    </history>
    <!--(c) the authors - correct author names and publication date here if necessary. Date in form ', dd.mm.yyyy' after jmir.org-->
    <copyright-statement>©Haihong Guo, Xu Na, Li Hou, Jiao Li. Originally published in the Journal of Medical Internet Research (http://www.jmir.org), 20.06.2017.</copyright-statement>
    <copyright-year>2017</copyright-year>
    <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
      <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on http://www.jmir.org/, as well as this copyright and license information must be included.</p>
    </license>  
    <self-uri xlink:href="http://www.jmir.org/2017/6/e220/" xlink:type="simple"/>
    <abstract>
      <sec sec-type="background">
        <title>Background</title>
        <p>In question answering (QA) system development, question classification is crucial for identifying information needs and improving the accuracy of returned answers. Although the questions are domain-specific, they are asked by non-professionals, making the question classification task more challenging.</p>
      </sec>
      <sec sec-type="objective">
        <title>Objective</title>
        <p>This study aimed to classify health care–related questions posted by the general public (Chinese speakers) on the Internet.</p>
      </sec>
      <sec sec-type="methods">
        <title>Methods</title>
        <p>A topic-based classification schema for health-related questions was built by manually annotating randomly selected questions. The Kappa statistic was used to measure the interrater reliability of multiple annotation results. Using the above corpus, we developed a machine-learning method to automatically classify these questions into one of the following six classes: <italic>Condition Management</italic>, <italic>Healthy Lifestyle</italic>, <italic>Diagnosis</italic>, <italic>Health Provider Choice</italic>, <italic>Treatment</italic>, and <italic>Epidemiology</italic>.</p>
      </sec>
      <sec sec-type="results">
        <title>Results</title>
        <p>The consumer health question schema was developed with a four-hierarchical-level of specificity, comprising 48 quaternary categories and 35 annotation rules. The 2000 sample questions were coded with 2000 major codes and 607 minor codes. Using natural language processing techniques, we expressed the Chinese questions as a set of lexical, grammatical, and semantic features. Furthermore, the effective features were selected to improve the question classification performance. From the 6-category classification results, we achieved an average precision of 91.41%, recall of 89.62%, and <italic>F</italic><sub>1</sub> score of 90.24%.</p>
      </sec>
      <sec sec-type="conclusions">
        <title>Conclusions</title>
        <p>In this study, we developed an automatic method to classify questions related to Chinese health care posted by the general public. It enables Artificial Intelligence (AI) agents to understand Internet users’ information needs on health care.</p>
      </sec>
    </abstract>
    <kwd-group>
      <kwd>classification</kwd>
      <kwd>natural language processing</kwd>
      <kwd>hypertension</kwd>
      <kwd>consumer health information</kwd>
    </kwd-group></article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>The Internet is increasingly becoming a main resource for consumers to acquire health information. Until December 2015, there were 152 million Internet health users in China, indicating that 22.1% of Chinese Internet users have looked online for health information and services [<xref ref-type="bibr" rid="ref1">1</xref>]. Many studies have proved that health-related information online could impact consumers’ health-related attitudes and behaviors [<xref ref-type="bibr" rid="ref2">2</xref>-<xref ref-type="bibr" rid="ref4">4</xref>]. However, consumers have difficulty in expressing their information needs accurately using medical query terms, thus failing to retrieve relevant health information [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref6">6</xref>]. Automatic question answering (QA) systems are available for such users and they respond with concise and correct answers using natural language processing techniques. Thus the QA systems have become one of the most important research focuses in the field of biomedicine [<xref ref-type="bibr" rid="ref7">7</xref>].</p>
      <p>In general, a QA system consists of 3 modules: question analysis, information retrieval, and answer extraction. In the first module, question classification plays an important role in identifying the information needs of consumers, reducing the space of candidate answers, and further improving the accuracy of returned answers [<xref ref-type="bibr" rid="ref8">8</xref>]. Classification schema is the basis of question classification. However, due to the difference in the information needs of health providers and consumers [<xref ref-type="bibr" rid="ref9">9</xref>-<xref ref-type="bibr" rid="ref11">11</xref>], the existing question classification schemas for professional health-related questions (the International Classification of Primary Care [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>], the Taxonomies of Generic Clinical Questions (TGCQ) [<xref ref-type="bibr" rid="ref14">14</xref>], etc) are not suitable for consumer health questions. Although some research focuses on the classification schema of consumer health questions [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>], it has not been defined in a systematic manner yet. Therefore, it is a prerequisite to design a concise and valid classification schema.</p>
      <p>Several studies have been conducted for automatic quesiton classification in the field of health and medicine in order to identify the general topics of clinical questions [<xref ref-type="bibr" rid="ref17">17</xref>], distinguish between answerable and unanswerable intensive care unit (ICU) questions [<xref ref-type="bibr" rid="ref18">18</xref>], separate consumer health questions from professional medical questions [<xref ref-type="bibr" rid="ref19">19</xref>], and classify the types of consumer health questions [<xref ref-type="bibr" rid="ref20">20</xref>]. Research has demonstrated that support vector machines (SVMs) performed the best among the most commonly explored algorithms, including naive bayesian, decision tree, maximum entropy, logistic regression, and conditional random fields. However, different patterns of thinking and habits of Chinese expression offen cause a mass of difference in the flexibility of word order and parse for Chinese health questions [<xref ref-type="bibr" rid="ref21">21</xref>]. Several studies on Chinese NLP focused on clinical named entity recognition [<xref ref-type="bibr" rid="ref22">22</xref>], diseases, or drag-related clinical information extraction [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>] and speculation detection [<xref ref-type="bibr" rid="ref25">25</xref>] from the free-text of pathology and operation notes. The main challenges in these tasks were word segmentation and feature representation and selection. To our knowledge, few studies have investigated consumer health question classification in Chinese.</p>
      <p>As one of the most common chronic diseases, hypertension has become the main risk factor of cardiovascular diseases. It was estimated that China had 270 million patients with hypertension in 2012, and the incidence rate was approximately 3% per year [<xref ref-type="bibr" rid="ref26">26</xref>]. Thus, hypertension-related questions are frequently asked with large variability on the Internet. For this reason, this study aimed at building a general topic classification schema and an automatic classification method for consumer health questions in Chinese, for the purpose of facilitating users’ hypertension-related information needs analysis and answer extraction.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Data Collection</title>
        <p>We collected questions posted by health consumers from 1st January to 10th August, 2014, with the tags “hypertension (高血压)” or “blood pressure (血压)” under the Q&#38;A (有问必答) section on a Chinese health website with more than 35 million registered users [<xref ref-type="bibr" rid="ref27">27</xref>] and imported the data into a MySQL (MySQL Community Edition, Oracle) database. The resulting database included 98,032 messages, from which 2000 messages were randomly selected as the sample for analysis.</p>
        <p>In this study, “question” is defined as a request that a health consumer has posted on the website on a certain subject to elicit answers from physicians, which was identified based on meaning, not form. We focused on questions related to hypertension (<italic>高血压</italic>), which was sometimes expressed as “high blood pressure (<italic>高血压</italic>),” or simply as “high pressure (<italic>高压</italic>).” Therefore, we manually discarded messages that did not match the definition and that were irrelevant to hypertension but which contained similar words such as “high pressure oxygen (<italic>高压氧</italic>),” “hyperbaric cabin (<italic>高压舱</italic>),” “high voltage (<italic>高压电</italic>),” “pressure cooker (<italic>高压锅</italic>),” and so on. A new message was randomly selected from the database when an irrelevant message was discarded from the sample, so as to keep the sample size at 2000.</p>
        <p>The website provides a template for users to generate questions, which includes three fields: (1) describe your health status (<italic>病情描述</italic>), (2) treatments or tests in the past (<italic>曾经的治疗或检查情况</italic>), and (3) what kinds of help do you want (<italic>想得到怎样的帮助</italic>). This template might lead to confusion in customers regarding how to post their questions. To deal with this case, we developed a rule: if the phrase “what kinds of help do you want (<italic>想得到怎样的帮助</italic>)” was found in the message, then we would take the sentence after the phrase as the “question.” Otherwise, we would take the whole message as the “question.” By doing this, we collected 2000 questions with an average length of 48 words.</p>
      </sec>
      <sec>
        <title>Classification Schema and Corpus Construction</title>
        <p>A topic-based classification schema was developed based on TGCQ [<xref ref-type="bibr" rid="ref14">14</xref>] and the Layered Model of Context for Consumer Health Information Searching (LMCC) [<xref ref-type="bibr" rid="ref15">15</xref>], and some categories were divided into more specific sub-categories to code the specific information needs. We produced the annotations in 4 rounds (<xref ref-type="fig" rid="figure1">Figure 1</xref>). In round 1, one annotator (specialized in medical informatics) annotated all the 2000 sample questions, following the classification schema. Some categories were added to accommodate questions that did not fall into any existing specialty during the process. For purposes of consistency improvement among coders, and the usability of the classification, a list of annotation rules was developed and some question patterns were enumerated for even the smallest category. As a result, the preliminary classification schema for consumer health questions included 101 topic categories and 32 annotation rules.</p>
        <p>In round 2, four other annotators (two specialized in medicine and two specialized in informatics) independently annotated 200 questions randomly selected from the sample, using the classification schema. The authors compared the consistency of the five coding results (including the one in the first round) and categorized the 200 questions into three groups: (1) all annotators agreed (n=73), (2) only one disagreed (n=63), and (3) more than one disagreed (n=64). Then we focused on the last group. We addressed ambiguous elements by further specifying annotation rules and improving the descriptions of the question patterns.</p>
        <p>In round 3, the revised classification was distributed to the five annotators who independently annotated another 300 questions randomly selected from the remaining sample of 1800 messages. This step was done to measure the interrater reliability of the classification schema as well as to further modify it.</p>
        <p>In the last round, each of three annotators independently annotated 500 from the remaining 1500 messages. So each of the 2000 sample questions were annotated by at least two annotators. The authors compared the coding results and the disparities were discussed to achieve an agreement. The codes agreed upon during this step were regarded as the final schema. The number of questions in each category was calculated, and categories in which no questions were filled were deleted (such as physical characteristics of drugs, pharmacodynamics, and mechanism of drug action).</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>A four-round annotating process to construct and modify the classification schema and annotated corpus.</p>
          </caption>
          <graphic xlink:href="jmir_v19i6e220_fig1.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Automatic Classification of the First-Level Topics</title>
        <p>The 2000 questions annotated by the above steps were used to train and test the classifiers for the primary level topics, including <italic>Diagnosis</italic>, <italic>Treatment</italic>, <italic>Condition Management</italic>, <italic>Healthy Lifestyle</italic>, and <italic>Health Provider Choice</italic>.</p>
        <sec>
          <title>Feature Selection</title>
          <p>We explored various features for machine-learning, including lexical, grammatical, semantic, and statistical information (<xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>).</p>
          <sec>
            <title>Lexical Features Such as Bag-of-Words and Part-of-Speech</title>
            <p>The word segmentation was obtained from Rwordseg [<xref ref-type="bibr" rid="ref28">28</xref>], a Chinese word segmentation tool under R environment based on the Chinese lexical analysis system, ICTCLAS, which reached a precision of 97.58% on the <italic>973</italic> experts testing [<xref ref-type="bibr" rid="ref29">29</xref>]. The Chinese part-of-speech tag was obtained by using the Stanford Parser (version 3.3.1) [<xref ref-type="bibr" rid="ref30">30</xref>].</p>
          </sec>
          <sec>
            <title>Grammatical Features Such as Interrogative Words, Noun Head Chunks, Verb Head Chunks, Noun Rear Chunks, Verb Rear Chunks, Interrogative Words + Noun or Verb Head Chunks, and Noun or Verb Rear Chunks + Interrogative Words</title>
            <p>We manually developed a dictionary of 42 Chinese interrogative words based on baike.baidu [<xref ref-type="bibr" rid="ref31">31</xref>] and general types of Chinese consumer questions summarized by our former research [<xref ref-type="bibr" rid="ref32">32</xref>]. In this study, the noun or verb head chunk is the first noun or verb after the first interrogative word in a question, and the noun or verb rear chunk is the last noun or verb before the first interrogative word. They are likely to be the dependent words of the interrogative word that help to express the semantic information in the question [<xref ref-type="bibr" rid="ref33">33</xref>].</p>
          </sec>
          <sec>
            <title>CMeSH Concepts and Semantic Types</title>
            <p>The controlled vocabulary of Chinese Medical Subject Headings (CMeSH) [<xref ref-type="bibr" rid="ref34">34</xref>] was applied to recognize the medical concepts and their semantic types (<italic>Disease</italic>, <italic>Drug</italic>, and <italic>Symptom</italic>) in the Chinese consumer health questions.</p>
          </sec>
          <sec>
            <title>Keywords</title>
            <p>These were a combination of lexical and statistical features. We used three ways to extract the keywords from a question: (1) the first <italic>k</italic> words of maximum term frequency (TF), (2) the first <italic>k</italic> words of maximum inverse-document frequency (IDF), and (3) the first <italic>k</italic> words of maximum TF-IDF. We adopted the heuristic equation (1) developed by Cao et al [<xref ref-type="bibr" rid="ref17">17</xref>] to calculate <italic>k</italic>, which was based on the observation that the number of keywords increases when the question length increases.</p>
          </sec>
          <sec>
            <title>Statistical Features</title>
            <p>These include question length, maximum, minimum, and average word length, maximum, minimum and average TF, maximum, minimum, and average IDF, and maximum, minimum and average TF-IDF. The corpus used to calculate the IDF of each word contained nearly 100 thousand hypertension-related messages that we had collected in our former research [<xref ref-type="bibr" rid="ref32">32</xref>]. The TF, IDF, and TF-IDF were computed by equations (2), (3), and (4), shown in <xref ref-type="fig" rid="figure2">Figure 2</xref>.</p>
            <fig id="figure2" position="float">
              <label>Figure 2</label>
              <caption>
                <p>Mathematical equations.</p>
              </caption>
              <graphic xlink:href="jmir_v19i6e220_fig2.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
            </fig>
            <p>As the feature space dimension was very large, and some of them could have degraded the performance of the classifiers, we adopted Φ-score to select the most discriminative features, which measures the discriminations in two sets of real numbers [<xref ref-type="bibr" rid="ref35">35</xref>]. Given the training vectors x<sub>s,</sub>, s=1,..., m, if the number of positive and negative instances are n+ and n-, respectively, the Φ-score of the t<sup>th</sup> feature is defined in equation (5) in <xref ref-type="fig" rid="figure2">Figure 2</xref>. The larger the Φ(t) is, the more likely this feature is more discriminative. Therefore, we used Φ(t) as the feature selection criterion, and the implementation steps were as follows:</p>
            <p>Calculate Φ(t) of every feature</p>
            <p>Calculate the avg Φ of each type of feature and, further, set it as the threshold of the corresponding feature type. The avg Φ was chosen as the feature selection threshold because the distribution of Φ differs greatly between different types of features, while this method can help to keep all the useful features in different types [<xref ref-type="bibr" rid="ref36">36</xref>].</p>
            <p>For each type of machine-learning feature, select features with Φ ≥ avg Φ of this type.</p>
          </sec>
        </sec>
        <sec>
          <title>Classifiers</title>
          <p>Since a question can be assigned to multiple topics, the task in this paper was a multi-label classification problem, which was usually transformed into one or more single-label classification or regression problems [<xref ref-type="bibr" rid="ref37">37</xref>]. We therefore transformed the task into six binary classification problems (one-versus-rest for each) so as to suit the SVMs [<xref ref-type="bibr" rid="ref38">38</xref>], which were commonly used and claimed to be the best in related works [<xref ref-type="bibr" rid="ref17">17</xref>-<xref ref-type="bibr" rid="ref20">20</xref>]. We used machine-learning algorithms within the R project for statistical computing (version 3.3.1) for automatic question classification, including naive bayesian, SVMs, decision tree, maximum entropy, logistic regression, and conditional random fields. The results showed that SVMs performed the best among all the algorithms in 10-fold cross-validation.</p>
        </sec>
        <sec>
          <title>Training and Testing</title>
          <p>Due to the skewed distribution of consumer questions to different topics, an under-sampling method for the majority classes was applied to ensure that each classifier was trained and tested on the same number of “positive” and “negative” questions. We reported the classification performance using 10-fold cross-validation. The sample data for each binary classifier was equally divided into 10-folds: one of them was used as testing data, and the ramaining 9 folds as training data. The cross-validation process was repeated 10 times (equal to the folds) and the average value and standard deviation were reported. All cases in the sample data were used for both training and validation. Thus, each case was used for validation exactly once, which was the distinct advantage in this method [<xref ref-type="bibr" rid="ref39">39</xref>].</p>
        </sec>
      </sec>
      <sec>
        <title>Evaluation Metrics</title>
        <p>The interrater reliability of the classification schema was evaluated by the kappa statistic, which could correct agreement that occurred by chance. Kappa=(P<sub>o</sub>-P<sub>e</sub>)/(1-P<sub>e</sub>), where P<sub>o</sub> is the observed agreement and P<sub>e</sub> is the agreement expected by chance [<xref ref-type="bibr" rid="ref40">40</xref>]. When the number of categories was large, as in this study, P<sub>e</sub> would be close to zero, and the kappa value would be close to P<sub>o</sub> [<xref ref-type="bibr" rid="ref14">14</xref>]. Thus, we directly used P<sub>o</sub> as the kappa value. The bigger the kappa value, the better the agreement. We assume that when the user asked more than one question, it was acceptable to answer any one of them. Therefore, a liberal reliability criterion was used: a match was recorded if either the main or minor topics assigned by one annotator matched the other’s assignments.</p>
        <p>The performance of automatic classification methods was evaluated by precision (p), recall (r) and <italic>F</italic><sub>1</sub> score, all of which are commonly used as evaluation metrics for text categorization, and we report the average of each metric. Precision is the number of correctly classified cases divided by the total number of cases classified for the category; recall is the number of correctly classified cases divided by the total number of cases of that class; and <italic>F</italic><sub>1</sub> score is the harmonic mean of precision and recall, calculated as <italic>F</italic><sub>1</sub> =(2×p×r) / (p + r).</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Classification Schema of Consumer Health Questions</title>
        <p>The final classification schema was a four-hierarchical-level of specificity, consisting of 48 quaternary categories (see <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>) and 35 annotation rules. The first level included seven areas, namely diagnosis, treatment, condition management, epidemiology, healthy lifestyle, health provider choice, and other. A branching structure of secondary, tertiary, and quaternary levels describes more specific topics of the questions than its upper level. One or more closely related question patterns were listed for each quaternary category. <xref ref-type="table" rid="table1">Table 1</xref> shows examples of consumer health questions in Chinese with their pattern and annotated tags on the topics of diagnosis and treatment, respectively.</p>
        <p>Table1. An example of consumer health questions in Chinese with their pattern and annotated tags.</p>
        <table-wrap position="float" id="table1">
          <table width="725" cellpadding="7" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="106"/>
            <col width="71"/>
            <col width="505"/>
            <thead>
              <tr valign="top">
                <td>General Topics</td>
                <td>Items</td>
                <td>Contents</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td rowspan="3">Diagnosis</td>
                <td>Question</td>
                <td>昨天不知道怎么事，突然感到心慌慌的，四肢发凉，全身冒冷汗，之后老婆扶我到小区医院那里去看，量了一下血压，血压比以往要高，之后医生叫我放松，休息了20分钟左右，又感觉没有什么事了。。 请问突然感觉到心慌，四肢发凉，血压升高，这是啥病啊? (Yesterday, my heart suddenly palpitated, my limbs became cold, and my whole body began to sweat. Then my wife accompanied me to the community hospital and checked my blood pressure; it was higher than before. The doctor told me to relax, and I feel much better after resting for about 20 minutes… suddenly felt flustered, limbs became cold, and blood pressure rose. What disease is it?)</td>
              </tr>
              <tr valign="top">
                <td>Pattern</td>
                <td>临床发现X1、X2、X3、……，这是啥病？(Clinical finding X1, X2, X3,… What disease is it?)</td>
              </tr>
              <tr valign="top">
                <td>Tag</td>
                <td>1.1.4.1 “诊断(Diagnosis)→病因/临床发现的解释(Interpretation of clinical finding)→不具体的发现或多种发现(Uncertain/multiple findings)”</td>
              </tr>
              <tr valign="top">
                <td rowspan="3">Treatment</td>
                <td>Question</td>
                <td>65岁老人血压高经常不稳定，吃哪种降压药最好？(A 65-year-old man with unsteady high blood pressure… What’s the best blood pressure drug to take?)</td>
              </tr>
              <tr valign="top">
                <td>Pattern</td>
                <td>病情y，吃/用/服用哪种药最好？(Condition y: What’s the best drug to take or use?)</td>
              </tr>
              <tr valign="top">
                <td>Tag</td>
                <td>2.1.2.1 “治疗(Treatment)→药物治疗(Drug therapy)→效力/适应症/药物选择(efficacy/indications/drug choosing)→治疗(Treatment)”</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>General Topics of Questions Asked by Health Consumers</title>
        <p>This study found that although health consumers would ask numerous health questions about themselves or their families, the general topics of the questions were limited to a small number and each category of the topics had its particular question patterns. The 2000 Chinese consumer health questions were annotated with 2000 major codes and 607 minor codes. The distribution of the sample questions on the primary level category is shown in <xref ref-type="table" rid="table2">Table 2</xref>. 26.35% of the questions were annotated with more than one topic, which demonstrated that health consumers tend to ask more than one question at a time and the question messages usually belong to multiple topic categories [<xref ref-type="bibr" rid="ref11">11</xref>] (<xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>). These findings indicated that the various consumer health questions could be represented by limited topics and keywords, and the task to classify those topics was a multi-label problem [<xref ref-type="bibr" rid="ref37">37</xref>].</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Distribution of the 2000 consumer health questions in Chinese on the primary level of topics.</p>
          </caption>
          <table width="750" cellpadding="7" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="66"/>
            <col width="203"/>
            <col width="66"/>
            <col width="57"/>
            <col width="130"/>
            <thead>
              <tr valign="top">
                <td>No.</td>
                <td>General Topics</td>
                <td>Positive</td>
                <td>Negative</td>
                <td>Total</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>1</td>
                <td>Diagnosis</td>
                <td>600</td>
                <td>1400</td>
                <td>2000</td>
              </tr>
              <tr valign="top">
                <td>2</td>
                <td>Treatment</td>
                <td>1167</td>
                <td>833</td>
                <td>2000</td>
              </tr>
              <tr valign="top">
                <td>3</td>
                <td>Condition management</td>
                <td>136</td>
                <td>1864</td>
                <td>2000</td>
              </tr>
              <tr valign="top">
                <td>4</td>
                <td>Epidemiology</td>
                <td>233</td>
                <td>1767</td>
                <td>2000</td>
              </tr>
              <tr valign="top">
                <td>5</td>
                <td>Healthy lifestyle</td>
                <td>278</td>
                <td>1722</td>
                <td>2000</td>
              </tr>
              <tr valign="top">
                <td>6</td>
                <td>Health provider choice</td>
                <td>45</td>
                <td>1955</td>
                <td>2000</td>
              </tr>
              <tr valign="top">
                <td>7</td>
                <td>Other</td>
                <td>5</td>
                <td><break/></td>
                <td><break/></td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Total</td>
                <td>2000</td>
                <td>2000</td>
                <td>2000</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Interrater Reliability of the Classification Schema</title>
        <p>The kappa statistic for the five annotators was 0.63 in the quaternary level of the classification, indicating “substantial” reliability, better than in several similar studies, such as assigning topics to general clinical questions (kappa=0.53) [<xref ref-type="bibr" rid="ref14">14</xref>]. When only the primary and secondary levels were considered, the kappa value increased to 0.75. When only the seven broad areas in the primary level were considered, the kappa value was 0.82, slightly better than automatically classifying question types for consumer health questions in English conducted by Roberts et al [<xref ref-type="bibr" rid="ref20">20</xref>].</p>
      </sec>
      <sec>
        <title>Feature Selection for Automatic Question Classification</title>
        <p>The Φ-score of each feature was calculated for each binary classifier. We found that their distribution between different types of features differed greatly. The performance of classifiers using features with Φ ≥ avg Φ was not worse than that of those classifiers using all the features in the corresponding types, and some of them were even higher than the latter. Taking the topic of <italic>Lifestyle</italic> as an example, the average and standard deviation of Φ in each feature type are shown in the third and fourth columns in <xref ref-type="table" rid="table3">Table 3</xref>. The avg Φ of bag-of-words was 0.0016 with a standard deviation of 0.0067, while the values of keywords with maximum TF were 0.0008 and 0.0009, respectively. The average <italic>F</italic><sub>1</sub> score of the classifier was 74.08% when using all the 6154 features in part-of-speech, while the performance increased to 78.84% when just taking the 1490 features with Φ ≥ avg Φ (<xref ref-type="fig" rid="figure2">Figure 2</xref>). Similar cases can be seen in feature types of noun rear chunks, interrogative + noun or verb head chunks, verb rear chunks + interrogative, keywords with maximum TF, TF-IDF, and so on. The observations indicated that some of the features in each type either do nothing to the classifiers or have some side effects on them. Rejecting these features could not only save the computing resources so as to increase the efficiency, but also improve the performance of the classifiers.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Number and Φ distribution of each type of feature for the Chinese consumer health question classification on the topic of <italic>Lifestyle.</italic></p>
          </caption>
          <table width="595" cellpadding="7" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="66"/>
            <col width="203"/>
            <col width="66"/>
            <col width="57"/>
            <col width="38"/>
            <col width="80"/>
            <thead>
              <tr valign="top">
                <td>Levels</td>
                <td>Features Types<sup>a</sup></td>
                <td>Avg Φ</td>
                <td>σ (Φ)</td>
                <td>n<sub>AF</sub></td>
                <td>n<sub>(Φ ≥ avg Φ)</sub></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td rowspan="2">Lexical <break/><break/></td>
                <td>Bag-of-words</td>
                <td>0.0016</td>
                <td>0.0067</td>
                <td>4967</td>
                <td>1301</td>
              </tr>
              <tr valign="top">
                <td>Part-of-speech</td>
                <td>0.0014</td>
                <td>0.0060</td>
                <td>6154</td>
                <td>1490</td>
              </tr>
              <tr valign="top">
                <td rowspan="9">Grammatical <break/><break/><break/><break/><break/><break/><break/><break/><break/><break/><break/><break/><break/><break/><break/><break/></td>
                <td>Interrogative words</td>
                <td>0.0039</td>
                <td>0.0204</td>
                <td>97</td>
                <td>13</td>
              </tr>
              <tr valign="top">
                <td>Noun head chunks</td>
                <td>0.0011</td>
                <td>0.0010</td>
                <td>48</td>
                <td>14</td>
              </tr>
              <tr valign="top">
                <td>Verb head chunks</td>
                <td>0.0008</td>
                <td>0.0007</td>
                <td>19</td>
                <td>6</td>
              </tr>
              <tr valign="top">
                <td>Noun rear chunks</td>
                <td>0.0011</td>
                <td>0.0019</td>
                <td>73</td>
                <td>14</td>
              </tr>
              <tr valign="top">
                <td>Verb rear chunks</td>
                <td>0.0010</td>
                <td>0.0013</td>
                <td>22</td>
                <td>3</td>
              </tr>
              <tr valign="top">
                <td>Interrogative + noun head chunks</td>
                <td>0.0011</td>
                <td>0.0013</td>
                <td>328</td>
                <td>86</td>
              </tr>
              <tr valign="top">
                <td>Interrogative + verb head chunks</td>
                <td>0.0011</td>
                <td>0.0010</td>
                <td>312</td>
                <td>85</td>
              </tr>
              <tr valign="top">
                <td>Noun rear chunks + interrogative</td>
                <td>0.0010</td>
                <td>0.0013</td>
                <td>315</td>
                <td>67</td>
              </tr>
              <tr valign="top">
                <td>Verb rear chunks + interrogative</td>
                <td>0.0012</td>
                <td>0.0024</td>
                <td>318</td>
                <td>74</td>
              </tr>
              <tr valign="top">
                <td>Semantic</td>
                <td>CMeSH concepts</td>
                <td>0.0016</td>
                <td>0.0033</td>
                <td>43</td>
                <td>9</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>CMeSH semantic types</td>
                <td>0.0124</td>
                <td>0.0101</td>
                <td>3</td>
                <td>1</td>
              </tr>
              <tr valign="top">
                <td rowspan="3">Lexical &#38; Statistical <break/><break/></td>
                <td>Keywords (TF)</td>
                <td>0.0008</td>
                <td>0.0009</td>
                <td>1510</td>
                <td>282</td>
              </tr>
              <tr valign="top">
                <td>Keywords (IDF)</td>
                <td>0.0007</td>
                <td>0.0008</td>
                <td>1137</td>
                <td>192</td>
              </tr>
              <tr valign="top">
                <td>Keywords (TF-IDF)</td>
                <td>0.0008</td>
                <td>0.0008</td>
                <td>1208</td>
                <td>190</td>
              </tr>
              <tr valign="top">
                <td>Statistical</td>
                <td>Statistical features</td>
                <td>0.0073</td>
                <td>0.0060</td>
                <td>13</td>
                <td>5</td>
              </tr>
              <tr valign="top">
                <td><break/></td>
                <td>Total with duplicates replaced</td>
                <td><break/></td>
                <td><break/></td>
                <td>15349</td>
                <td>3656</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>For each type of feature, σ (Φ) is the standard deviation of Φ, n<sub>AF</sub> is the total number of features, n (Φ ≥ avg Φ) is the number of features with Φ ≥ avg Φ.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>Therefore, the features with Φ ≥ avg Φ in every feature type were selected as input features for machine-learning, in order to keep all the useful features in different types and to improve the performance of the classifiers. Thus, each classifier received a different feature set, and the number of features within them are showed in the third column in <xref ref-type="table" rid="table4">Table 4</xref>. For example, words such as “<italic>drinking</italic> (饮 酒),” “<italic>eat a meal</italic> (吃 饭),” “<italic>breakfast</italic> (早餐),” “<italic>stay up late</italic> (熬夜),” “<italic>weight</italic> (体重),”  “<italic>daily life</italic> (平时),” “<italic>nurse one’s health</italic> (调理),” and so on were the effective bag-of-words features for the classifier for <italic>Healthy Lifestyle</italic> but not effective for the classifier for <italic>Diagnosis</italic>. On the contrary, words such as “<italic>diagnose</italic> (诊断),” “<italic>judge</italic> (判断),” “<italic>indicate</italic> (提示),” “<italic>physical examination</italic> (查体),” “<italic>cardiac murmur</italic> (杂音),” “<italic>head rush</italic> (脑充血),” “<italic>dazed</italic> (昏沉沉),” and so on were the effective bag-of-words features for the classifier for <italic>Diagnosis</italic> but not effective for the classifier for <italic>Healthy Lifestyle</italic>.</p>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Feature reduction and the performance of each classifier.</p>
          </caption>
          <table width="569" cellpadding="7" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="152"/>
            <col width="71"/>
            <col width="71"/>
            <col width="80"/>
            <col width="48"/>
            <col width="61"/>
            <thead>
              <tr valign="top">
                <td>General topics</td>
                <td>N (all features)</td>
                <td>N (selected features)</td>
                <td>Feature reduction proportion</td>
                <td>Avg <italic>F</italic><sub>1</sub></td>
                <td>σ (<italic>F</italic><sub>1</sub>)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Diagnosis</td>
                <td>15349</td>
                <td>5311</td>
                <td>0.6540</td>
                <td>0.9855</td>
                <td>0.0164</td>
              </tr>
              <tr valign="top">
                <td>Treatment</td>
                <td>15349</td>
                <td>4216</td>
                <td>0.7253</td>
                <td>0.7602</td>
                <td>0.0482</td>
              </tr>
              <tr valign="top">
                <td>Condition management</td>
                <td>15349</td>
                <td>3150</td>
                <td>0.7948</td>
                <td>0.9963</td>
                <td>0.0117</td>
              </tr>
              <tr valign="top">
                <td>Epidemiology</td>
                <td>15349</td>
                <td>4194</td>
                <td>0.7268</td>
                <td>0.7177</td>
                <td>0.0798</td>
              </tr>
              <tr valign="top">
                <td>Healthy lifestyle</td>
                <td>15349</td>
                <td>3656</td>
                <td>0.7618</td>
                <td>0.9913</td>
                <td>0.0166</td>
              </tr>
              <tr valign="top">
                <td>Health provider choice</td>
                <td>15349</td>
                <td>2282</td>
                <td>0.8513</td>
                <td>0.9635</td>
                <td>0.0594</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Performance of each feature type for Chinese consumer health question classification on the topic of Lifestyle.</p>
          </caption>
          <graphic xlink:href="jmir_v19i6e220_fig3.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Performance improvement of each classifier by selecting features above the threshold.</p>
          </caption>
          <graphic xlink:href="jmir_v19i6e220_fig4.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Performance of the Automatic Classification Methods</title>
        <p>The results were obtained from SVMs in the kernlab package because it performed the best among all the classification algorithms available in the R project. The research findings showed that the feature spaces were reduced from 65.40% to 85.13% by dropping features under the threshold (<xref ref-type="table" rid="table4">Table 4</xref>). Furthermore, the performance of each classifier also improved significantly (<xref ref-type="fig" rid="figure3">Figure 3</xref>). For example, the average <italic>F</italic><sub>1</sub> score of the classifier for <italic>Diagnosis</italic> dramatically increased from 79.84% to 98.55%, while the feature space reduced from 15349 to 5311 (reduced 65.40%). The feature space of the classifier for Treatment reduced greatly (Down from 15349 to 4216, reduced 72.53%), although the improvement of performance was not so obvious (F1 score increased from 75.82% to 76.02%). The results of 10-fold cross validation on each binary classifier affirmed the hypothesis we proposed in the Feature Selection sections.</p>
        <p>The performance on the classification of most topics of consumer health questions in Chinese was high. The evaluation metrics (average precision, recall, and <italic>F</italic><sub>1</sub> score) of <italic>Diagnosis, Condition Management, Healthy Lifestyle, and Health Provider Choice</italic> were above 95%, while, the metrics of <italic>Treatment</italic> and <italic>Epidemiology</italic> were 76.02% and 71.77%, which were relatively weaker than the others. The standard deviation indicated that the performance of each binary classifier was relatively robust. As of 6-category classification results, we achieved an average precision of 91.41%, recall of 89.62%, and <italic>F</italic><sub>1</sub> score of 90.24%.</p>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>A classification schema of consumer health questions was built in this study and 2000 hypertension-related consumer health questions in Chinese were manually annotated based on this schema. The research findings demonstrated that health consumers were mainly concerned about what was wrong with their health (or the health of someone they cared about), why it was wrong, how to treat it (including choosing which provider to treat), whether the drugs they used had adverse effects or would do harm in some conditions (eg, pregnancy, breast feeding), whether they could recover from the illness, and what they could do to improve their health in everyday life (mainly diet suggestions).</p>
        <p>We explored a machine-learning method to automatically classify these Chinese consumer health questions into one of the six primary level topics, with a novel scoring metric to select the most effective features from the abundant feature types we had explored. The results proved that selecting the features with Φ ≥ avg Φ in each feature type as input features for machine- learning not only increased the efficiency, but also improved the performance of the classifiers successfully. From the 6-category classification results, we achieved an average precision of 91.41%, recall of 89.62%, and <italic>F</italic><sub>1</sub> score of 90.24%.</p>
      </sec>
      <sec>
        <title>Comparison With Prior Work</title>
        <sec>
          <title>Similarities and Differences in Questions Asked by Health Consumers and Providers</title>
          <p>Compared with the 1396 clinical questions annotated by Ely et al [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref41">41</xref>], we found that while health consumers and providers both asked questions about diagnosis, treatment, condition management, and epidemiology, the questions posted by consumers were much more ambiguous. For instance, the frequency of questions with multiple findings was twice that of health providers’ inquiries under the category of interpretation of clinical findings. It might be because consumers could not identify the most important findings, so they tended to list all the findings they knew. Although the frequency of treatment questions was almost equal in the two groups, health providers’ questions were more specific to drug therapy (37.2% vs 22.1%), and they sometimes asked these questions on very specialized topics, such as composition, pharmacodynamics, action mechanism, and serum levels of drugs [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref41">41</xref>]. Such questions were rarely asked by health consumers. Moreover, health consumers would ask how to keep healthy or help in recovery in daily life, because many of them have recognized that lifestyle factors, such as diet, exercise, weight loss, and mood control, would impact their health status as well [<xref ref-type="bibr" rid="ref42">42</xref>]. However, physicians seldom asked these questions during a patient encounter, possibly because they mainly focused on medical service rather than lifestyle advice [<xref ref-type="bibr" rid="ref10">10</xref>]. Similarly, health consumers never asked questions about coordination with other providers, doctor-patient communication, doctor and patient education, administrative rules, ethics, and legal issues, because these tasks were usually regarded as health providers' responsibility. These findings affirmed again that, health consumers’ information needs differed significantly from those of providers. Therefore, the existing classification schemas and automatic classification methods for clinical questions cannot be applied to consumer health questions directly [<xref ref-type="bibr" rid="ref11">11</xref>].</p>
        </sec>
        <sec>
          <title>Features Explored for Automatic Classifiers</title>
          <p>Compared with other related studies on automatic question classification in the domain of health and medicine, we explored an abundant number of feature types for automatic classifiers. For example, Cao et al [<xref ref-type="bibr" rid="ref17">17</xref>] explored the features of bag-of-words, n-grams, part-of-speech, UMLS concepts, and semantic types, as well as IDF to identify general topics of clinical questions. Patrick et al [<xref ref-type="bibr" rid="ref18">18</xref>] used bag-of-words, Bigram, interrogative words, SNOMED category, verb and its subject, and verb and its object as feature sets to distinguish answerable and unanswerable ICU questions. Liu et al [<xref ref-type="bibr" rid="ref19">19</xref>] picked bag-of-words, word length, question length, IDF, interrogative words, personal pronouns, indefinite pronouns, and auxiliary verbs as learning features to separate consumer questions from professional questions in the health domain. Roberts et al [<xref ref-type="bibr" rid="ref20">20</xref>] explored the features of bag-of-words, part-of-speech, UMLS concepts, named entity, word length, IDF, and noun and verb head chunks to classify question types for consumer health questions in English, while Conway et al [<xref ref-type="bibr" rid="ref43">43</xref>] used bag-of-words, n-grams, semantic UMLS types, and named entity as features to classify disease outbreak reports. In other words, bag-of-words, part-of-speech, and semantic types were the most commonly used features for question classification. Our work adopted all the effective features in the prior works with the UMLS concepts and semantic types replaced by CMeSH concepts and semantic types. We also explored three ways to extract the keywords from a question using the machine-learning features, that is, we took the first <italic>k</italic> words with maximum TF, IDF, or TF-IDF as keywords. In addition, we added noun or verb rear chunks + interrogative words according to the specialties of word order in the Chinese language. The results showed that it worked better than the interrogative words + noun or verb head chunks, which was commonly used for question classification in English.</p>
        </sec>
        <sec>
          <title>Feature Selection for Automatic Question Classification</title>
          <p>The feature selection methods in our work were quite different from other relative works, and it has proved that our methods were much more effective and easy. Cao et al [<xref ref-type="bibr" rid="ref17">17</xref>], Liu et al [<xref ref-type="bibr" rid="ref19">19</xref>], and Roberts et al [<xref ref-type="bibr" rid="ref20">20</xref>]employed a method of combining different types of features without considering the threshold, in which they explored different combinations of different feature types and selected the best combination with the maximum <italic>F</italic><sub>1</sub> score of the classifier. Thus, a feature type would be either picked up or rejected in their approach, which may have caused the loss of some effective features. Another disadvantage of this method was the difficulty in exploring all the possible combinations of different feature types. On the contrary, we adopted a much more efficient method to combine all the effective features from each feature type with Φ ≥ avg Φ, which was also proved to be very effective (as described in the results section).</p>
        </sec>
        <sec>
          <title>Performance of the Classifiers</title>
          <p>The performance of the classifiers trained by our study was quite satisfying. The average <italic>F</italic><sub>1</sub> scores for the four classifiers for <italic>Condition management, Health lifestyle, Diagnosis, and Health provider choice</italic> were 99.63%, 99.13%, 98.55%, and 96.35%, respectively. The results were more significant than those of other similar studies. For example, the classification of 13 general topics of clinical questions conducted by Cao et al [<xref ref-type="bibr" rid="ref17">17</xref>], which reached the highest <italic>F</italic><sub>1</sub> score (89.3%) on the classifier for <italic>Pharmacology</italic>, while the majority of the scores were between 70% and 80%, and the classification of 13 question types of consumer questions carried out by Roberts et al [<xref ref-type="bibr" rid="ref20">20</xref>], which achieved the highest <italic>F</italic><sub>1</sub> score (90.6%) on the classifier for <italic>Management</italic>, with 5 between 80% and 90%, and 5 below 70%. It is worth noting that the methods proposed in this paper and those in the related works were experimented on different datasets in different languages. Further, there were two main reasons for the differences between this study and others, although the same algorithm of SVMs was used. On the one hand, the feature types and the feature selection methods applied in this study were more efficient and effective (as discussed above); on the other hand, the classification schema used in this study was more distinguishable. For example, questions about <italic>Etiology</italic> or <italic>Cause</italic> and <italic>Diagnosis</italic> were very similar and always asked together. Thus, they were annotated as one topic (<italic>Diagnosis)</italic> in our study. However, Cao et al [<xref ref-type="bibr" rid="ref17">17</xref>] and Roberts et al [<xref ref-type="bibr" rid="ref20">20</xref>] annotated them as different types.</p>
        </sec>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>One of the limitations of this work is that the sample questions we used to build the classification schema and to train the automatic classifiers were from only one Chinese health website and defined to be hypertension or blood pressure related. Therefore, the applicability of the classification schema and the validity of the automatic classifiers for the vast majority of questions from other websites and other diseases remain to be tested. Another limitation of this work is that some types of features, such as keywords and bag-of-words, might be correlated. However, our feature selection algorithm did not take the impact of correlation into consideration. We only reached moderate performances on the automatic classifiers for the general topics of Treatment and Epidemiology, whereas the reasons for this remain to be explored in the future.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>One of the specialties of this research was that Chinese consumer health questions were chosen as the research object. We built a classification schema of consumer health questions which consisted of 48 quaternary categories and 35 annotation rules, and we annotated 2000 questions in Chinese that were randomly selected from nearly 100 thousand messages about hypertension. Then, by using these annotated questions as the corpus, we explored a machine-learning method to automatically classify Chinese consumer health questions into six general topics to facilitate users’ information needs analysis and answer extraction. We explored an abundant number of feature types and adopted a novel method to select all the effective features with Φ ≥ avg Φ. The results proved that our classification approach was relatively more efficient and effective as compared with similar studies.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <app id="app1">
        <title>Multimedia Appendix 1</title>
        <p>Supplementary tables.</p>
        <media xlink:href="jmir_v19i6e220_app1.pdf" xlink:title="PDF File (Adobe PDF File), 53KB"/>
      </app>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">TGCQ</term>
          <def>
            <p>Taxonomies of Generic Clinical Questions</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">LMCC</term>
          <def>
            <p>Layered Model of Context for Consumer Health Information Searching</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This research was supported by the Chinese Academy of Medical Sciences (Grant No. 2016ZX330011) and the National Social Science Foundation of China (Grant No. 14BTQ032). The authors would like to thank Dr Chao Xu for his helpful suggestions on data processing.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="web"> <person-group person-group-type="author"> <collab>China Internet Network Information Center</collab> </person-group> <source>cnnic</source> <year>2016</year> <comment>China internet network development state statistic report<ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.cnnic.net.cn/hlwfzyj/hlwxzbg/201601/P020160122469130059846.pdf">http://www.cnnic.net.cn/hlwfzyj/hlwxzbg/201601/P020160122469130059846.pdf</ext-link> </comment> </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
        <name name-style="western">
        <surname>Fox</surname> 
        <given-names>S</given-names></name> </person-group>
        <source>Pew Research Center</source> 
        <year>2011</year> 
        <comment>The social life of health information
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.pewinternet.org/files/old-media/Files/Reports/2011/PIP_Social_Life_of_Health_Info.pdf">http://www.pewinternet.org/files/old-media/Files/Reports/2011/PIP_Social_Life_of_Health_Info.pdf</ext-link></comment> </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>Y</given-names>
          </name>
        </person-group>
        <source>d.wanfangdata</source>  
        <year>2011</year>  
        <access-date>2017-05-27</access-date>
        <comment>Empirical research on impact of internet use on individual health behaviors 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://d.wanfangdata.com.cn/Thesis/D186454">http://d.wanfangdata.com.cn/Thesis/D186454</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6qlZYIitE"/></comment> </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>AT</given-names>
          </name>
        </person-group>
        <article-title>The Relationship between health management and information behavior over time: a study of the illness journeys of people living with fibromyalgia</article-title>
        <source>J Med Internet Res</source>  
        <year>2016</year>  
        <month>10</month>  
        <day>25</day>  
        <volume>18</volume>  
        <issue>10</issue>  
        <fpage>e269</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2016/10/e269/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/jmir.5309</pub-id>
        <pub-id pub-id-type="medline">27780794</pub-id>
        <pub-id pub-id-type="pii">v18i10e269</pub-id>
        <pub-id pub-id-type="pmcid">PMC5101414</pub-id></nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Fiksdal</surname>
            <given-names>AS</given-names>
          </name>
          <name name-style="western">
            <surname>Kumbamu</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Jadhav</surname>
            <given-names>AS</given-names>
          </name>
          <name name-style="western">
            <surname>Cocos</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Nelsen</surname>
            <given-names>LA</given-names>
          </name>
          <name name-style="western">
            <surname>Pathak</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>McCormick</surname>
            <given-names>JB</given-names>
          </name>
        </person-group>
        <article-title>Evaluating the process of online health information searching: a qualitative approach to exploring consumer perspectives</article-title>
        <source>J Med Internet Res</source>  
        <year>2014</year>  
        <volume>16</volume>  
        <issue>10</issue>  
        <fpage>e224</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2014/10/e224/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/jmir.3341</pub-id>
        <pub-id pub-id-type="medline">25348028</pub-id>
        <pub-id pub-id-type="pii">v16i10e224</pub-id>
        <pub-id pub-id-type="pmcid">PMC4285658</pub-id></nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Zeng</surname>
            <given-names>QT</given-names>
          </name>
          <name name-style="western">
            <surname>Kogan</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Plovnick</surname>
            <given-names>RM</given-names>
          </name>
          <name name-style="western">
            <surname>Crowell</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Lacroix</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Greenes</surname>
            <given-names>RA</given-names>
          </name>
        </person-group>
        <article-title>Positive attitudes and failed queries: an exploration of the conundrums of consumer health information retrieval</article-title>
        <source>Int J Med Inform</source>  
        <year>2004</year>  
        <month>02</month>  
        <volume>73</volume>  
        <issue>1</issue>  
        <fpage>45</fpage>  
        <lpage>55</lpage>  
        <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2003.12.015</pub-id>
        <pub-id pub-id-type="medline">15036078</pub-id>
        <pub-id pub-id-type="pii">S1386505603002211</pub-id></nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Mao</surname>
            <given-names>XL</given-names>
          </name>
          <name name-style="western">
            <surname>LI</surname>
            <given-names>XM</given-names>
          </name>
        </person-group>
        <article-title>A survey on question and answering systems</article-title>
        <source>Journal of Frontiers of Computer Science and Technology</source>  
        <year>2012</year>  
        <volume>6</volume>  
        <issue>3</issue>  
        <fpage>193</fpage>  
        <lpage>207</lpage> </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Zhen</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>X</given-names>
          </name>
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <article-title>Overview on question classification in question-answering system</article-title>
        <source>Journal of Anhui University of Technology (Natural Science)</source>  
        <year>2015</year>  
        <volume>32</volume>  
        <issue>1</issue>  
        <fpage>48</fpage>  
        <lpage>54</lpage> </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Boot Cécile</surname>
            <given-names>RL</given-names>
          </name>
          <name name-style="western">
            <surname>Meijman</surname>
            <given-names>FJ</given-names>
          </name>
        </person-group>
        <article-title>Classifying health questions asked by the public using the ICPC-2 classification and a taxonomy of generic clinical questions: an empirical exploration of the feasibility</article-title>
        <source>Health Commun</source>  
        <year>2010</year>  
        <month>03</month>  
        <volume>25</volume>  
        <issue>2</issue>  
        <fpage>175</fpage>  
        <lpage>81</lpage>  
        <pub-id pub-id-type="doi">10.1080/10410230903544969</pub-id>
        <pub-id pub-id-type="medline">20390683</pub-id>
        <pub-id pub-id-type="pii">919824679</pub-id></nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Reeder</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Le</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Thompson</surname>
            <given-names>HJ</given-names>
          </name>
          <name name-style="western">
            <surname>Demiris</surname>
            <given-names>G</given-names>
          </name>
        </person-group>
        <article-title>Comparing information needs of health care providers and older adults: findings from a wellness study</article-title>
        <source>Stud Health Technol Inform</source>  
        <year>2013</year>  
        <volume>192</volume>  
        <fpage>18</fpage>  
        <lpage>22</lpage>  
        <pub-id pub-id-type="medline">23920507</pub-id>
        <pub-id pub-id-type="pmcid">PMC4362702</pub-id></nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Roberts</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Demner-Fushman</surname>
            <given-names>D</given-names>
          </name>
        </person-group>
        <article-title>Interactive use of online health resources: a comparison of consumer and professional questions</article-title>
        <source>J Am Med Inform Assoc</source>  
        <year>2016</year>  
        <month>07</month>  
        <volume>23</volume>  
        <issue>4</issue>  
        <fpage>802</fpage>  
        <lpage>11</lpage>  
        <pub-id pub-id-type="doi">10.1093/jamia/ocw024</pub-id>
        <pub-id pub-id-type="medline">27147494</pub-id>
        <pub-id pub-id-type="pii">ocw024</pub-id>
        <pub-id pub-id-type="pmcid">PMC4926747</pub-id></nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Gebel</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Okkes</surname>
            <given-names>I</given-names>
          </name>
        </person-group>
        <source>International classification of primary care (ICPC-2-NL)</source>  
        <year>2000</year>  
        <publisher-loc>United Kingdom</publisher-loc>
        <publisher-name>Oxford University Press</publisher-name></nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Schnall</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Cimino</surname>
            <given-names>JJ</given-names>
          </name>
          <name name-style="western">
            <surname>Currie</surname>
            <given-names>LM</given-names>
          </name>
          <name name-style="western">
            <surname>Bakken</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <article-title>Information needs of case managers caring for persons living with HIV</article-title>
        <source>J Am Med Inform Assoc</source>  
        <year>2011</year>  
        <month>05</month>  
        <day>01</day>  
        <volume>18</volume>  
        <issue>3</issue>  
        <fpage>305</fpage>  
        <lpage>8</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21270131"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1136/jamia.2010.006668</pub-id>
        <pub-id pub-id-type="medline">21270131</pub-id>
        <pub-id pub-id-type="pii">jamia.2010.006668</pub-id>
        <pub-id pub-id-type="pmcid">PMC3078676</pub-id></nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Ely</surname>
            <given-names>JW</given-names>
          </name>
          <name name-style="western">
            <surname>Osheroff</surname>
            <given-names>JA</given-names>
          </name>
          <name name-style="western">
            <surname>Gorman</surname>
            <given-names>PN</given-names>
          </name>
          <name name-style="western">
            <surname>Ebell</surname>
            <given-names>MH</given-names>
          </name>
          <name name-style="western">
            <surname>Chambliss</surname>
            <given-names>ML</given-names>
          </name>
          <name name-style="western">
            <surname>Pifer</surname>
            <given-names>EA</given-names>
          </name>
          <name name-style="western">
            <surname>Stavri</surname>
            <given-names>PZ</given-names>
          </name>
        </person-group>
        <article-title>A taxonomy of generic clinical questions: classification study</article-title>
        <source>Br Med J</source>  
        <year>2000</year>  
        <month>08</month>  
        <day>12</day>  
        <volume>321</volume>  
        <issue>7258</issue>  
        <fpage>429</fpage>  
        <lpage>32</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.pubmedcentral.nih.gov/articlerender.fcgi?artid=27459&#38;tool=pmcentrez&#38;rendertype=abstract"/>
        </comment>  
        <pub-id pub-id-type="medline">10938054</pub-id>
        <pub-id pub-id-type="pmcid">PMC27459</pub-id></nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Yan</surname>
            <given-names>Z</given-names>
          </name>
        </person-group>
        <article-title>Toward a layered model of context for health information searching: an analysis of consumer-generated questions</article-title>
        <source>J Am Soc Inf Sci Technol</source>  
        <year>2013</year>  
        <volume>64</volume>  
        <issue>6</issue>  
        <fpage>1158</fpage>  
        <lpage>72</lpage>  
        <pub-id pub-id-type="doi">10.1002/asi.22821</pub-id></nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Roberts</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Masterton</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Fiszman</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <source>Citeseerx.ist</source>  
        <year>2014</year>  
        <access-date>2017-05-27</access-date>
        <comment>Annotating question types for consumer health questions 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://citeseerx.ist.psu.edu/viewdoc/download;jsessionid=9DE05B71F8A3E344512A3366E516A1B8?doi=10.1.1.673.6987&#38;rep=rep1&#38;type=pdf">http://citeseerx.ist.psu.edu/viewdoc/download;jsessionid=9DE05B71F8A3E344512A3366E516A1B8?doi=10.1.1.673.6987&#38;rep=rep1&#38;type=pdf</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6qlbO0DdO"/></comment> </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Cao</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Cimino</surname>
            <given-names>JJ</given-names>
          </name>
          <name name-style="western">
            <surname>Ely</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Yu</surname>
            <given-names>H</given-names>
          </name>
        </person-group>
        <article-title>Automatically extracting information needs from complex clinical questions</article-title>
        <source>J Biomed Inform</source>  
        <year>2010</year>  
        <month>12</month>  
        <volume>43</volume>  
        <issue>6</issue>  
        <fpage>962</fpage>  
        <lpage>71</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(10)00106-1"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1016/j.jbi.2010.07.007</pub-id>
        <pub-id pub-id-type="medline">20670693</pub-id>
        <pub-id pub-id-type="pii">S1532-0464(10)00106-1</pub-id>
        <pub-id pub-id-type="pmcid">PMC2991382</pub-id></nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Patrick</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Li</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>An ontology for clinical questions about the contents of patient notes</article-title>
        <source>J Biomed Inform</source>  
        <year>2012</year>  
        <month>04</month>  
        <volume>45</volume>  
        <issue>2</issue>  
        <fpage>292</fpage>  
        <lpage>306</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(11)00196-1"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1016/j.jbi.2011.11.008</pub-id>
        <pub-id pub-id-type="medline">22142949</pub-id>
        <pub-id pub-id-type="pii">S1532-0464(11)00196-1</pub-id></nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Antieau</surname>
            <given-names>LD</given-names>
          </name>
          <name name-style="western">
            <surname>Yu</surname>
            <given-names>H</given-names>
          </name>
        </person-group>
        <article-title>Toward automated consumer question answering: automatically separating consumer questions from professional questions in the healthcare domain</article-title>
        <source>J Biomed Inform</source>  
        <year>2011</year>  
        <month>12</month>  
        <volume>44</volume>  
        <issue>6</issue>  
        <fpage>1032</fpage>  
        <lpage>8</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(11)00135-3"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1016/j.jbi.2011.08.008</pub-id>
        <pub-id pub-id-type="medline">21856442</pub-id>
        <pub-id pub-id-type="pii">S1532-0464(11)00135-3</pub-id>
        <pub-id pub-id-type="pmcid">PMC3226885</pub-id></nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Roberts</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Kilicoglu</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Fiszman</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Demner-Fushman</surname>
            <given-names>D</given-names>
          </name>
        </person-group>
        <article-title>Automatically classifying question types for consumer health questions</article-title>
        <source>AMIA Annu Symp Proc</source>  
        <year>2014</year>  
        <volume>2014</volume>  
        <fpage>1018</fpage>  
        <lpage>27</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25954411"/>
        </comment>  
        <pub-id pub-id-type="medline">25954411</pub-id>
        <pub-id pub-id-type="pmcid">PMC4420005</pub-id></nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Zhu</surname>
            <given-names>L</given-names>
          </name>
        </person-group>
        <article-title>A review of Chinese Q &#38; A system questions</article-title>
        <source>Technology Intelligence Engineering</source>  
        <year>2016</year>  
        <fpage>01</fpage>  
        <lpage>42</lpage> </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Wu</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Jiang</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Lei</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Xu</surname>
            <given-names>H</given-names>
          </name>
        </person-group>
        <article-title>Named entity recognition in Chinese clinical text using deep neural network</article-title>
        <source>Stud Health Technol Inform</source>  
        <year>2015</year>  
        <volume>216</volume>  
        <fpage>624</fpage>  
        <lpage>8</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/26262126"/>
        </comment>  
        <pub-id pub-id-type="medline">26262126</pub-id>
        <pub-id pub-id-type="pmcid">PMC4624324</pub-id></nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Zeng</surname>
            <given-names>Q</given-names>
          </name>
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>X</given-names>
          </name>
          <name name-style="western">
            <surname>Li</surname>
            <given-names>Z</given-names>
          </name>
        </person-group>
        <article-title>Extracting clinical information from free-text of pathology and operation notes via Chinese natural language processing</article-title>
        <year>2010</year>  
        <month>12</month>  
        <day>1</day>  
        <conf-name>IEEE International Conference on Bioinformatics and Biomedicine Workshops (BIBMW)</conf-name>
        <conf-date>2010</conf-date>
        <conf-loc>Hong Kong</conf-loc>
        <fpage>593</fpage>  
        <lpage>597</lpage> </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>W</given-names>
          </name>
          <name name-style="western">
            <surname>Zeng</surname>
            <given-names>Q</given-names>
          </name>
          <name name-style="western">
            <surname>Li</surname>
            <given-names>Z</given-names>
          </name>
          <name name-style="western">
            <surname>Feng</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>L</given-names>
          </name>
        </person-group>
        <article-title>Extracting important information from Chinese Operation Notes with natural language processing methods</article-title>
        <source>J Biomed Inform</source>  
        <year>2014</year>  
        <month>04</month>  
        <volume>48</volume>  
        <fpage>130</fpage>  
        <lpage>6</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(14)00006-9"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1016/j.jbi.2013.12.017</pub-id>
        <pub-id pub-id-type="medline">24486562</pub-id>
        <pub-id pub-id-type="pii">S1532-0464(14)00006-9</pub-id></nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Kang</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>X</given-names>
          </name>
          <name name-style="western">
            <surname>Wen</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Elhadad</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Lei</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>Speculation detection for Chinese clinical notes: impacts of word segmentation and embedding models</article-title>
        <source>J Biomed Inform</source>  
        <year>2016</year>  
        <month>04</month>  
        <volume>60</volume>  
        <fpage>334</fpage>  
        <lpage>41</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(16)00033-2"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1016/j.jbi.2016.02.011</pub-id>
        <pub-id pub-id-type="medline">26923634</pub-id>
        <pub-id pub-id-type="pii">S1532-0464(16)00033-2</pub-id>
        <pub-id pub-id-type="pmcid">PMC5282586</pub-id></nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <collab>National Center for Cardiovascular Diseases of China</collab>
        </person-group>
        <source>Report on cardiovascular diseases in China (2013)</source>  
        <year>2014</year>  
        <publisher-loc>Beijing</publisher-loc>
        <publisher-name>Beijing Encyclopedia of China Publishing House</publisher-name></nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <collab>XYWY</collab>
        </person-group>
        <source>XYWY</source>  
        <year>2016</year>  
        <access-date>2017-05-27</access-date>
        <comment>Trustworthy Internet Healthcare Service Platform 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.xywy.com/about/index.html">http://www.xywy.com/about/index.html</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6qldIeXre"/></comment> </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Li</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <source>Csdn.net</source>  
        <year>2016</year>  
        <access-date>2017-05-27</access-date>
        <comment>Introduction of Rwordseg 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://download.csdn.net/detail/cl1143015961/8436741">http://download.csdn.net/detail/cl1143015961/8436741</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6qleBRsFs"/></comment> </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="web">
        <source>sewm.pku</source> 
        <comment>ICTCLAS: Institute of Computing Technology, Chinese Lexical Analysis System
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://sewm.pku.edu.cn/QA/reference/ICTCLAS/FreeICTCLAS/">http://sewm.pku.edu.cn/QA/reference/ICTCLAS/FreeICTCLAS/</ext-link></comment> </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="web">
        <source>nlp.stanford</source> 
        <comment>Stanford Log-linear Part-Of-Speech Tagger
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://nlp.stanford.edu/software/tagger.shtml">https://nlp.stanford.edu/software/tagger.shtml</ext-link></comment> </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="web">
        <source>baike.baidu</source>  
        <access-date>2017-05-27</access-date>
        <comment>Question words 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://baike.baidu.com/item/%E7%96%91%E9%97%AE%E8%AF%8D">http://baike.baidu.com/item/%E7%96%91%E9%97%AE%E8%AF%8D</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6qle8GlKD"/></comment> </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Guo</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Li</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Dai</surname>
            <given-names>T</given-names>
          </name>
        </person-group>
        <article-title>Consumer health information needs and question classification: analysis of hypertension related questions asked by consumers on a Chinese health website</article-title>
        <source>Stud Health Technol Inform</source>  
        <year>2015</year>  
        <volume>216</volume>  
        <fpage>810</fpage>  
        <lpage>4</lpage>  
        <pub-id pub-id-type="medline">26262164</pub-id></nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Niu</surname>
            <given-names>YQ</given-names>
          </name>
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Duan</surname>
            <given-names>LG</given-names>
          </name>
        </person-group>
        <article-title>Study on classification features of Chinese interrogatives</article-title>
        <source>Computer Application and Software</source>  
        <year>2012</year>  
        <volume>29</volume>  
        <issue>3</issue>  
        <fpage>108</fpage>  
        <lpage>111</lpage> </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Sun</surname>
            <given-names>HX</given-names>
          </name>
          <name name-style="western">
            <surname>Li</surname>
            <given-names>JL</given-names>
          </name>
          <name name-style="western">
            <surname>Li</surname>
            <given-names>DY</given-names>
          </name>
        </person-group>
        <article-title>The study on semantic mapping from free word to subject headings based on semantic system of CMeSH</article-title>
        <source>Data analysis and knowledge discovery</source>  
        <year>2013</year>  
        <volume>29</volume>  
        <issue>11</issue>  
        <fpage>46</fpage>  
        <lpage>51</lpage>  
        <pub-id pub-id-type="doi">10.11925/infotech.1003-3513.2013.11.07</pub-id></nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>YW</given-names>
          </name>
          <name name-style="western">
            <surname>Lin</surname>
            <given-names>CJ</given-names>
          </name>
        </person-group>
        <article-title>Combining SVMs with various feature selection strategies</article-title>
        <source>Studies in Fuzziness and Soft Computing</source>  
        <year>2006</year>  
        <publisher-loc>Berlin, Heidelberg</publisher-loc>
        <publisher-name>Springer</publisher-name>
        <fpage>315</fpage>  
        <lpage>24</lpage> </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>L</given-names>
          </name>
          <name name-style="western">
            <surname>Li</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Yao</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Wu</surname>
            <given-names>X</given-names>
          </name>
        </person-group>
        <article-title>[A P300 detection algorithm based on F-score feature selection and support vector machines]</article-title>
        <source>Sheng Wu Yi Xue Gong Cheng Xue Za Zhi</source>  
        <year>2008</year>  
        <month>02</month>  
        <volume>25</volume>  
        <issue>1</issue>  
        <fpage>23</fpage>  
        <lpage>6, 52</lpage>  
        <pub-id pub-id-type="medline">18435249</pub-id></nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
        <name name-style="western">
        <surname>Tsoumakas</surname> 
        <given-names>G</given-names></name> 
        <name name-style="western">
        <surname>Katakis</surname> 
        <given-names>I</given-names></name> </person-group>
        <source>lpis.csd</source> 
        <year>2016</year> 
        <comment>Multi-label classification: an overview
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://lpis.csd.auth.gr/publications/tsoumakas-ijdwm.pdf">http://lpis.csd.auth.gr/publications/tsoumakas-ijdwm.pdf</ext-link></comment> </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Gou</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Huang</surname>
            <given-names>X</given-names>
          </name>
        </person-group>
        <article-title>SVM multi-class classification</article-title>
        <source>Journal of Data Acquisition &#38; Processing</source>  
        <year>2006</year>  
        <volume>21</volume>  
        <issue>3</issue>  
        <fpage>334</fpage>  
        <lpage>339</lpage> </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="web">
        <source>Wikipedia</source> 
        <comment>Cross-validation (statistics)
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://en.wikipedia.org/wiki/Cross-validation_(statistics).pdf">https://en.wikipedia.org/wiki/Cross-validation_(statistics).pdf</ext-link></comment> </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="book">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Elliott</surname>
            <given-names>AC</given-names>
          </name>
          <name name-style="western">
            <surname>Woodward</surname>
            <given-names>WA</given-names>
          </name>
        </person-group>
        <source>Statistical analysis quick reference guidebook: with SPSS examples</source>  
        <year>2006</year>  
        <publisher-loc>United States</publisher-loc>
        <publisher-name>SAGE Publications, Inc</publisher-name></nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Ely</surname>
            <given-names>JW</given-names>
          </name>
          <name name-style="western">
            <surname>Osheroff</surname>
            <given-names>JA</given-names>
          </name>
          <name name-style="western">
            <surname>Ebell</surname>
            <given-names>MH</given-names>
          </name>
          <name name-style="western">
            <surname>Bergus</surname>
            <given-names>GR</given-names>
          </name>
          <name name-style="western">
            <surname>Levy</surname>
            <given-names>BT</given-names>
          </name>
          <name name-style="western">
            <surname>Chambliss</surname>
            <given-names>ML</given-names>
          </name>
          <name name-style="western">
            <surname>Evans</surname>
            <given-names>ER</given-names>
          </name>
        </person-group>
        <article-title>Analysis of questions asked by family doctors regarding patient care</article-title>
        <source>Br Med J</source>  
        <year>1999</year>  
        <month>08</month>  
        <day>07</day>  
        <volume>319</volume>  
        <issue>7206</issue>  
        <fpage>358</fpage>  
        <lpage>61</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/10435959"/>
        </comment>  
        <pub-id pub-id-type="medline">10435959</pub-id>
        <pub-id pub-id-type="pmcid">PMC28191</pub-id></nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <collab>Publicity Department of National HealthFamily Planning Commission of the People?s Republic of China</collab>
          <collab>Chinese Health Education Center</collab>
        </person-group>
        <source>moh.gov</source>  
        <access-date>2017-05-27</access-date>
        <comment>2012 Chinese residents health literacy monitoring report 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.moh.gov.cn/zhuz/xzqq/201412/e09a26a97b914abb80172e85f46c5d84.shtml">http://www.moh.gov.cn/zhuz/xzqq/201412/e09a26a97b914abb80172e85f46c5d84.shtml</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6qlfPXCbQ"/></comment> </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Conway</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Doan</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Kawazoe</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Collier</surname>
            <given-names>N</given-names>
          </name>
        </person-group>
        <article-title>Classifying disease outbreak reports using n-grams and semantic features</article-title>
        <source>Int J Med Inform</source>  
        <year>2009</year>  
        <month>12</month>  
        <volume>78</volume>  
        <issue>12</issue>  
        <fpage>e47</fpage>  
        <lpage>58</lpage>  
        <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2009.03.010</pub-id>
        <pub-id pub-id-type="medline">19447070</pub-id>
        <pub-id pub-id-type="pii">S1386-5056(09)00053-7</pub-id></nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
