<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v21i2e12783</article-id>
      <article-id pub-id-type="pmid">30785407</article-id>
      <article-id pub-id-type="doi">10.2196/12783</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Tweet Classification Toward Twitter-Based Disease Surveillance: New Data, Methods, and Evaluations</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Cruvinel</surname>
            <given-names>Thiago</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Dini</surname>
            <given-names>Guglielmo</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="author" id="contrib1">
          <name name-style="western">
            <surname>Wakamiya</surname>
            <given-names>Shoko</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-9371-1340</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib2">
          <name name-style="western">
            <surname>Morita</surname>
            <given-names>Mizuki</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-8592-5499</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib3">
          <name name-style="western">
            <surname>Kano</surname>
            <given-names>Yoshinobu</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-7864-842X</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib4">
          <name name-style="western">
            <surname>Ohkuma</surname>
            <given-names>Tomoko</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff6" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-5078-4814</ext-link>
        </contrib>
        <contrib contrib-type="author" id="contrib5" corresp="yes">
          <name name-style="western">
            <surname>Aramaki</surname>
            <given-names>Eiji</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Institute for Research Initiatives</institution>
            <institution>Nara Institute of Science and Technology</institution>
            <addr-line>8916-5 Takayama-cho</addr-line>
            <addr-line>Ikoma, 630-0192</addr-line>
            <country>Japan</country>
            <phone>81 743 72 6053</phone>
            <fax>81 743 72 6065</fax>
            <email>socialcomputing-office@is.naist.jp</email>
          </address>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-0201-3609</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
      <label>1</label>
      <institution>Institute for Research Initiatives</institution>
      <institution>Nara Institute of Science and Technology</institution>  
      <addr-line>Ikoma</addr-line>
      <country>Japan</country></aff>
      <aff id="aff2">
      <label>2</label>
      <institution>Graduate School of Science and Technology</institution>
      <institution>Nara Institute of Science and Technology</institution>  
      <addr-line>Ikoma</addr-line>
      <country>Japan</country></aff>
      <aff id="aff3">
      <label>3</label>
      <institution>Data Science Center</institution>
      <institution>Nara Institute of Science and Technology</institution>  
      <addr-line>Ikoma</addr-line>
      <country>Japan</country></aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Okayama University</institution>
        <addr-line>Okayama</addr-line>
        <country>Japan</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Shizuoka University</institution>
        <addr-line>Hamamatsu</addr-line>
        <country>Japan</country>
      </aff>
      <aff id="aff6">
        <label>6</label>
        <institution>Fuji Xerox Co., Ltd.</institution>
        <addr-line>Yokohama</addr-line>
        <country>Japan</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Eiji Aramaki 
        <email>socialcomputing-office@is.naist.jp</email></corresp>
      </author-notes>
      <pub-date pub-type="collection"><month>02</month><year>2019</year></pub-date>
      <pub-date pub-type="epub">
        <day>20</day>
        <month>02</month>
        <year>2019</year>
      </pub-date>
      <volume>21</volume>
      <issue>2</issue>
      <elocation-id>e12783</elocation-id>
      <!--history from ojs - api-xml-->
      <history>
        <date date-type="received">
          <day>9</day>
          <month>11</month>
          <year>2018</year>
        </date>
        <date date-type="rev-request">
          <day>28</day>
          <month>11</month>
          <year>2018</year>
        </date>
        <date date-type="rev-recd">
          <day>12</day>
          <month>12</month>
          <year>2018</year>
        </date>
        <date date-type="accepted">
          <day>13</day>
          <month>12</month>
          <year>2018</year>
        </date>
      </history>
      <copyright-statement>©Shoko Wakamiya, Mizuki Morita, Yoshinobu Kano, Tomoko Ohkuma, Eiji Aramaki. Originally published in the Journal of Medical Internet Research (http://www.jmir.org), 20.02.2019.</copyright-statement>
      <copyright-year>2019</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on http://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="http://www.jmir.org/2019/2/e12783/" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>The amount of medical and clinical-related information on the Web is increasing. Among the different types of information available, social media–based data obtained directly from people are particularly valuable and are attracting significant attention. To encourage medical natural language processing (NLP) research exploiting social media data, the 13th NII Testbeds and Community for Information access Research (NTCIR-13) Medical natural language processing for Web document (MedWeb) provides pseudo-Twitter messages in a cross-language and multi-label corpus, covering 3 languages (Japanese, English, and Chinese) and annotated with 8 symptom labels (such as cold, fever, and flu). Then, participants classify each tweet into 1 of the 2 categories: those containing a patient’s symptom and those that do not.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aimed to present the results of groups participating in a Japanese subtask, English subtask, and Chinese subtask along with discussions, to clarify the issues that need to be resolved in the field of medical NLP.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>In summary, 8 groups (19 systems) participated in the Japanese subtask, 4 groups (12 systems) participated in the English subtask, and 2 groups (6 systems) participated in the Chinese subtask. In total, 2 baseline systems were constructed for each subtask. The performance of the participant and baseline systems was assessed using the exact match accuracy, F-measure based on precision and recall, and Hamming loss.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>The best system achieved exactly 0.880 match accuracy, 0.920 F-measure, and 0.019 Hamming loss. The averages of match accuracy, F-measure, and Hamming loss for the Japanese subtask were 0.720, 0.820, and 0.051; those for the English subtask were 0.770, 0.850, and 0.037; and those for the Chinese subtask were 0.810, 0.880, and 0.032, respectively.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>This paper presented and discussed the performance of systems participating in the NTCIR-13 MedWeb task. As the MedWeb task settings can be formalized as the factualization of text, the achievement of this task could be directly applied to practical clinical applications.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>text mining</kwd>
        <kwd>social media</kwd>
        <kwd>machine learning</kwd>
        <kwd>natural language processing</kwd>
        <kwd>artificial intelligence</kwd>
        <kwd>surveillance</kwd>
        <kwd>infodemiology</kwd>
        <kwd>infoveillance</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Medical reports using electronic media are now replacing those of paper media [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. As a result, the importance of natural language processing (NLP) techniques in various medical fields has increased significantly. Currently, the development of practical tools to assist precise and timely medical decisions has been encouraged.</p>
      <p>To contribute to the progress of information retrieval research, a series of <italic>shared tasks</italic> (or contests, competitions, challenge evaluations, and critical assessments) is being used. Thus far, several shared tasks related to medical or health care have already been organized and provided datasets for various NLP tasks. These include the Informatics for Integrating Biology and the Bedside (i2b2) tasks [<xref ref-type="bibr" rid="ref3">3</xref>], the Text Retrieval Conference (TREC) Medical Records track [<xref ref-type="bibr" rid="ref4">4</xref>], TREC Clinical Decision Support or Precision Medicine tracks [<xref ref-type="bibr" rid="ref5">5</xref>-<xref ref-type="bibr" rid="ref9">9</xref>], the Cross-Language Evaluation Forum for European Languages (CLEF) eHealth [<xref ref-type="bibr" rid="ref10">10</xref>], and NII Testbeds and Community for Information access Research (NTCIR) Medical tasks and Medical Natural Language Processing (MedNLP) workshops [<xref ref-type="bibr" rid="ref11">11</xref>-<xref ref-type="bibr" rid="ref16">16</xref>]. Generally, these shared tasks provide clinical records.</p>
      <p>On the other hand, with the widespread use of the internet, considerable material concerning medical or health care has been shared on the Web, and several Web mining techniques for utilizing the material have been developed. One of the most popular medical applications of Web mining is flu surveillance [<xref ref-type="bibr" rid="ref17">17</xref>-<xref ref-type="bibr" rid="ref27">27</xref>]. Although most previous studies have relied on shallow textual clues in messages, such as the number of occurrences of specific keywords (eg, <italic>flu</italic> or <italic>influenza</italic>), such simple approaches have difficulty coping with the volume of noisy messages. Typical examples of noisy tweets on Twitter are those that simply express concern or awareness about flu (such as “Starting to get worried about swine flu”). To increase their accuracy, one of the most reasonable approaches employs a binary classifier to filter out noisy messages.</p>
      <p>Given this situation, the NTCIR-13 [<xref ref-type="bibr" rid="ref28">28</xref>] Medical Natural Language Processing for Web Document (MedWeb) task [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref30">30</xref>] is designed for obtaining health-related information by exploiting data on the Web, focusing on social media sites such as Twitter [<xref ref-type="bibr" rid="ref31">31</xref>] and Facebook [<xref ref-type="bibr" rid="ref32">32</xref>]. Specifically, we propose a generalized task setting that determines whether a message is written about a patient affected by a specific symptom for public health surveillance, referring to the following 2 characteristics:</p>
          <list list-type="order">
            <list-item>
      <p>Multi-label: This task handles not only a single symptom (such as influenza) but also multiple symptoms such as cold, cough or sore throat, diarrhea or stomach ache, fever, hay fever, headache, and runny nose. As a single message can contain multiple symptoms, this is a multi-labeling task.</p>
            </list-item>
            <list-item>
      <p>Cross-language: In contrast to the previous shared tasks, this task covers multiple languages, such as Japanese, English, and Chinese. To build parallel corpora, we translated the original Japanese messages to English and Chinese.</p>
            </list-item>
          </list>
      <p>In the NTCIR-13 MedWeb, we distributed each corpus to the participants [<xref ref-type="bibr" rid="ref33">33</xref>-<xref ref-type="bibr" rid="ref41">41</xref>], of whom 9 groups (7 academia groups, an industry group, and a joint group) submitted results (37 systems). Specifically, 8 groups (19 systems) participated in the Japanese subtask, 4 groups (12 systems) participated in the English subtask, and 2 groups (6 systems) participated in the Chinese subtask (see <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>). This report presents the results of these groups, along with discussions, to clarify the issues that need to be resolved in the field of medical NLP.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Materials</title>
        <sec>
          <title>Data</title>
          <p>The MedWeb task uses a collection of tweets that include at least one keyword of target diseases or symptoms (for brevity, we refer to these simply as <italic>symptoms</italic> hereafter). We set 8 symptoms, including cold, cough or sore throat (which we refer to as <italic>cough</italic>), diarrhea or stomachache (<italic>diarrhea</italic>), fever, hay fever, headache, influenza (<italic>flu</italic>), and runny nose.</p>
          <p>Owing to the Twitter Developer Policy on data redistribution [<xref ref-type="bibr" rid="ref42">42</xref>], the tweet data crawled using the application programming interface [<xref ref-type="bibr" rid="ref43">43</xref>] are not publicly available. Therefore, our data consist of pseudotweets created by a crowdsourcing service.</p>
          <p>To obtain the pseudotweets, we first collected Japanese tweets related to each symptom from Twitter. Then, we classified these tweets as positive or negative based on the previous study [<xref ref-type="bibr" rid="ref19">19</xref>]. Next, we extracted keyword sets that appeared frequently in the positive and negative tweets of the symptom by calculating term frequency and inverse document frequency. We call these keywords <italic>seed words</italic>.</p>
          <p>We then had a group of people create pseudotweets consisting of 100 to 140 characters, which included a symptom and at least one of the seed words of the symptom. Each person created 32 pseudotweets (2 tweets × 2 keyword sets [positive and negative] × 8 symptoms). As a result, 80 people were able to generate 2560 Japanese pseudotweets.</p>
          <p>In the last step, we had the Japanese pseudotweets translated into English and Chinese by relevant first-language practitioners. Therefore, we also had 2560 pseudotweets in both English and Chinese. The corpora are available in a previous paper [<xref ref-type="bibr" rid="ref44">44</xref>]. <xref ref-type="boxed-text" rid="box1">Textbox 1</xref> shows samples of each set of pseudotweets, whose ratios of positive labels are presented in <xref ref-type="table" rid="table1">Table 1</xref>. This table shows the ratio of positive labels out of each symptom’s 320 pseudotweets and the number of positive labels out of all symptoms’ 2560 pseudotweets. Common symptoms such as a runny nose, fever, headache, and cold tend to appear with the other symptoms. Then, the number of tweets of the flu labeled as <italic>p</italic> (positive) is relatively less than the others, indicating that the flu is likely to be a topic even if people did not suffer from flu. On the other hand, tweets concerning several symptoms such as a cough, headache, runny nose, and diarrhea are described in many cases when people suffered from them.</p>
          <boxed-text id="box1" position="float">
            <title>Samples of pseudotweets of the 8 symptoms. Note that English messages and Chinese messages were translated from Japanese messages.</title>
            <list list-type="order">
              <list-item>
                <p>Cold</p>
                <list list-type="bullet">
                  <list-item>
                    <p>風邪を引くと全身がだるくなる</p>
                  </list-item>
                  <list-item>
                    <p>The cold makes my whole body weak.</p>
                  </list-item>
                  <list-item>
                    <p>一感冒就浑身酸软无力。</p>
                  </list-item>
                </list>
              </list-item>
              <list-item>
                <p>Cough</p>
                <list list-type="bullet">
                  <list-item>
                    <p>あかん。咳込みすぎて頭まで痛くなってきた</p>
                  </list-item>
                  <list-item>
                    <p>This is not good. I coughed too much and I got a headache from it.</p>
                  </list-item>
                  <list-item>
                    <p>糟了。咳得太厉害，头都疼起来了。</p>
                  </list-item>
                </list>
              </list-item>
              <list-item>
                <p>Diarrhea</p>
                <list list-type="bullet">
                  <list-item>
                    <p>下痢ひどすぎで笑うわ</p>
                  </list-item>
                  <list-item>
                    <p>I gotta laugh. My diarrhea is so bad.</p>
                  </list-item>
                  <list-item>
                    <p>腹泻过于严重，很搞笑。</p>
                  </list-item>
                </list>
              </list-item>
              <list-item>
                <p>Fever</p>
                <list list-type="bullet">
                  <list-item>
                    <p>熱が出なくてもリンパが腫れることがよくある。</p>
                  </list-item>
                  <list-item>
                    <p>It’s not unusual for lymph nodes to get swollen, even when there’s no fever.</p>
                  </list-item>
                  <list-item>
                    <p>很多时候就算不发热淋巴也肿。</p>
                  </list-item>
                </list>
              </list-item>
              <list-item>
                <p>Hay fever</p>
                <list list-type="bullet">
                  <list-item>
                    <p>花粉症の症状が出てきたのは久し振りだ。</p>
                  </list-item>
                  <list-item>
                    <p>It’s been a while since I’ve had allergy symptoms.</p>
                  </list-item>
                  <list-item>
                    <p>好久没有出现花粉症的症状了。</p>
                  </list-item>
                </list>
              </list-item>
              <list-item>
                <p>Headache</p>
                <list list-type="bullet">
                  <list-item>
                    <p>頭痛がやばいから帰宅して寝るー</p>
                  </list-item>
                  <list-item>
                    <p>My headache is killing me, so I’m going to go home and sleep.</p>
                  </list-item>
                  <list-item>
                    <p>因为头疼得厉害，我回家睡觉了。</p>
                  </list-item>
                </list>
              </list-item>
              <list-item>
                <p>Flu</p>
                <list list-type="bullet">
                  <list-item>
                    <p>インフルエンザのワクチン打ちに行ってきた。</p>
                  </list-item>
                  <list-item>
                    <p>I went to get vaccinated for the flu.</p>
                  </list-item>
                  <list-item>
                    <p>去打了流感的疫苗。</p>
                  </list-item>
                </list>
              </list-item>
              <list-item>
                <p>Runny nose</p>
                <list list-type="bullet">
                  <list-item>
                    <p>鼻づまりで今日は休むわー</p>
                  </list-item>
                  <list-item>
                    <p>I’m not going today, because my stuffy nose is killing me.</p>
                  </list-item>
                  <list-item>
                    <p>因为鼻塞，今天休息吧！</p>
                  </list-item>
                </list>
              </list-item>
            </list>
          </boxed-text>
          <table-wrap position="float" id="table1">
            <label>Table 1</label>
            <caption>
              <p>Ratio of positive labels.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="200"/>
              <col width="400"/>
              <col width="400"/>
              <thead>
                <tr valign="top">
                  <td>Symptom</td>
                  <td>Ratio of number of positive tweets to the number of each symptom’s tweets (N=320 tweets)</td>
                  <td>Ratio of number of positive tweets to the total number of all symptoms’ tweets (N=2560 tweets)</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>Cold, n (%)</td>
                  <td>220 (0.6875)</td>
                  <td>355 (0.1387)</td>
                </tr>
                <tr valign="top">
                  <td>Cough, n (%)</td>
                  <td>295 (0.9219)</td>
                  <td>306 (0.1195)</td>
                </tr>
                <tr valign="top">
                  <td>Diarrhea, n (%)</td>
                  <td>230 (0.7188)</td>
                  <td>246 (0.0961)</td>
                </tr>
                <tr valign="top">
                  <td>Fever, n (%)</td>
                  <td>220 (0.6875)</td>
                  <td>438 (0.1711)</td>
                </tr>
                <tr valign="top">
                  <td>Hay fever, n (%)</td>
                  <td>208 (0.6500)</td>
                  <td>209 (0.0816)</td>
                </tr>
                <tr valign="top">
                  <td>Headache, n (%)</td>
                  <td>260 (0.8125)</td>
                  <td>328 (0.1281)</td>
                </tr>
                <tr valign="top">
                  <td>Flu, n (%)</td>
                  <td>128 (0.4000)</td>
                  <td>130 (0.0508)</td>
                </tr>
                <tr valign="top">
                  <td>Runny nose, n (%)</td>
                  <td>257 (0.8031)</td>
                  <td>499 (0.1949)</td>
                </tr>
              </tbody>
            </table>
          </table-wrap>
          <table-wrap position="float" id="table2">
            <label>Table 2</label>
            <caption>
              <p>Samples of the training data corpus for the English subtask.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="80"/>
              <col width="280"/>
              <col width="80"/>
              <col width="80"/>
              <col width="80"/>
              <col width="80"/>
              <col width="80"/>
              <col width="80"/>
              <col width="80"/>
              <col width="80"/>
              <thead>
                <tr valign="top">
                  <td>Tweet ID</td>
                  <td>Message</td>
                  <td>s<sub>1</sub><sup>a</sup></td>
                  <td>s<sub>2</sub></td>
                  <td>s<sub>3</sub></td>
                  <td>s<sub>4</sub></td>
                  <td>s<sub>5</sub></td>
                  <td>s<sub>6</sub></td>
                  <td>s<sub>7</sub></td>
                  <td>s<sub>8</sub></td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>1en<sup>b</sup></td>
                  <td>The cold makes my whole body weak.</td>
                  <td>p<sup>c</sup></td>
                  <td>n<sup>d</sup></td>
                  <td>n</td>
                  <td>n</td>
                  <td>n</td>
                  <td>n</td>
                  <td>n</td>
                  <td>n</td>
                </tr>
                <tr valign="top">
                  <td>2en</td>
                  <td>It’s been a while since I’ve had allergy symptoms.</td>
                  <td>n</td>
                  <td>n</td>
                  <td>n</td>
                  <td>n</td>
                  <td>p</td>
                  <td>n</td>
                  <td>n</td>
                  <td>p</td>
                </tr>
                <tr valign="top">
                  <td>3en</td>
                  <td>I’m so feverish and out of it because of my allergies. I’m so sleepy.</td>
                  <td>n</td>
                  <td>n</td>
                  <td>n</td>
                  <td>p</td>
                  <td>p</td>
                  <td>n</td>
                  <td>n</td>
                  <td>p</td>
                </tr>
                <tr valign="top">
                  <td>4en</td>
                  <td>I took some medicine for my runny nose, but it won’t stop.</td>
                  <td>n</td>
                  <td>n</td>
                  <td>n</td>
                  <td>n</td>
                  <td>n</td>
                  <td>n</td>
                  <td>n</td>
                  <td>p</td>
                </tr>
                <tr valign="top">
                  <td>5en</td>
                  <td>I had a bad case of diarrhea when I traveled to Nepal.</td>
                  <td>n</td>
                  <td>n</td>
                  <td>n</td>
                  <td>n</td>
                  <td>n</td>
                  <td>n</td>
                  <td>n</td>
                  <td>n</td>
                </tr>
                <tr valign="top">
                  <td>6en</td>
                  <td>It takes a millennial wimp to call in sick just because they’re coughing. It’s always important to go to work, no matter what.</td>
                  <td>n</td>
                  <td>p</td>
                  <td>n</td>
                  <td>n</td>
                  <td>n</td>
                  <td>n</td>
                  <td>n</td>
                  <td>n</td>
                </tr>
                <tr valign="top">
                  <td>7en</td>
                  <td>I’m not going today, because my stuffy nose is killing me.</td>
                  <td>n</td>
                  <td>n</td>
                  <td>n</td>
                  <td>n</td>
                  <td>n</td>
                  <td>n</td>
                  <td>n</td>
                  <td>p</td>
                </tr>
                <tr valign="top">
                  <td>8en</td>
                  <td>I never thought I would have allergies.</td>
                  <td>n</td>
                  <td>n</td>
                  <td>n</td>
                  <td>n</td>
                  <td>p</td>
                  <td>n</td>
                  <td>n</td>
                  <td>p</td>
                </tr>
                <tr valign="top">
                  <td>9en</td>
                  <td>I have a fever but I don’t think it’s the kind of cold that will make it to my stomach.</td>
                  <td>p</td>
                  <td>n</td>
                  <td>n</td>
                  <td>p</td>
                  <td>n</td>
                  <td>n</td>
                  <td>n</td>
                  <td>n</td>
                </tr>
                <tr valign="top">
                  <td>10en</td>
                  <td>My phlegm has blood in it and it’s really gross.</td>
                  <td>n</td>
                  <td>p</td>
                  <td>n</td>
                  <td>n</td>
                  <td>n</td>
                  <td>n</td>
                  <td>n</td>
                  <td>n</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table2fn1">
                <p><sup>a</sup>s<sub>1</sub>, s<sub>2</sub>, s<sub>3</sub>, s<sub>4</sub>, s<sub>5</sub>, s<sub>6</sub>, s<sub>7</sub>, and s<sub>8</sub> are IDs of the 8 symptoms (cold, cough, diarrhea, fever, hay fever, headache, flu, and runny nose).</p>
              </fn>
              <fn id="table2fn2">
                <p><sup>b</sup>ID corresponds to the corpora of other languages (eg, the tweet of <italic>1en</italic> corresponds to the tweets of <italic>1ja</italic> and <italic>1zh</italic>).</p>
              </fn>
              <fn id="table2fn3">
                <p><sup>c</sup>p indicates the positive label.</p>
              </fn>
              <fn id="table2fn4">
                <p><sup>d</sup>n indicates the negative label.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
        </sec>
        <sec>
          <title>Symptom Labeling</title>
          <p>This section describes the criteria used for symptom labeling: basic criteria and symptom-specific criteria [<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref46">46</xref>]. In this study, 2 annotators attached positive or negative labels of the 8 symptoms to tweets (<xref ref-type="table" rid="table2">Table 2</xref>).</p>
          <sec>
            <title>Basic Criteria</title>
            <p>The most basic criterion is that the labeling is examined from a clinical viewpoint, considering the medical importance of the information. Thus, nonclinical information should be disregarded. For example, older information (by several weeks) and nonsevere symptoms (a headache due to overdrinking) should be labeled as <italic>n</italic> (negative).</p>
            <p>The following 3 criteria describe the basic principles:</p>
          <list list-type="order">
            <list-item>
            <p>Factuality: The Twitter user (or someone close to the user) should be affected by a certain disease or have a symptom of the disease. A tweet that includes only the name of a disease or a symptom as a topic is removed by labeling it as <italic>n</italic> (negative).</p>
            </list-item>
            <list-item>
            <p>Tense (time): Older information, which is meaningless from the viewpoint of surveillance, should be discarded. Such information should also be labeled as <italic>n</italic> (negative). Here, we regard 24 hours as the standard condition. When the precise date and time are ambiguous, the general guideline is that information within 24 hours (eg, information related to the present day or previous day) is labeled as <italic>p</italic> (positive).</p>
            </list-item>
            <list-item>
            <p>Location: The location of the disease should be specified as follows. If a Twitter user is affected, the information is labeled as <italic>p</italic> (positive) because the location of the user is the place of onset of the symptom. In cases where the user is not personally affected, the information is labeled as <italic>p</italic> (positive) if it is within the same vicinity (prefecture) as that of the user, and as <italic>n</italic> (negative) otherwise.</p>
            </list-item>
          </list>
          </sec>
          <sec>
            <title>Symptom-Specific Criteria</title>
            <p>There are several exceptions to the fundamental annotation principles. For example, a remark about a <italic>headache</italic> might not relate to that about a clinical disease (such as headache due to excessive drinking). When conducting disease surveillance, such statements should be regarded as noise. To deal with disease-specific phenomena, we build a guideline that addresses exceptions for each disease. For example, cases such as <italic>excessive drinking</italic>, <italic>medication</italic>, <italic>pungently flavored food (including irritant),</italic> <italic>spiritual,</italic> <italic>motion sickness,</italic> <italic>morning,</italic> and <italic>menstrual pain</italic> should be excluded for <italic>headache.</italic> The exceptions are summarized in <xref ref-type="table" rid="table3">Table 3</xref>.</p>
          </sec>
        </sec>
      </sec>
      <sec>
        <title>Task Settings</title>
        <p>In the MedWeb task, we organized 3 subtasks: a Japanese subtask, an English subtask, and a Chinese subtask. The procedure of the MedWeb task is as follows:</p>
        <p><italic>Step 1.</italic> Training corpus distribution: The training data corpus and the annotation criteria were sent to the participant groups for development. The training data corpus comprises 1920 messages (75.00% of the whole corpus), with labels. Each message is labeled <italic>p</italic> (positive) or <italic>n</italic> (negative) for each of the 8 symptoms.</p>
        <p><italic>Step 2.</italic> Formal run result submission: After about a 3-month development period, the test data corpus was sent to each participant group. The test data corpus consists of 640 messages (25.0% of the whole corpus), without labels. Then, the participant groups developed their systems (<xref ref-type="table" rid="table4">Table 4</xref>) and submitted their annotated results within 2 weeks. Multiple results with up to 3 systems were allowed to be submitted.</p>
        <p><italic>Step 3.</italic> Evaluation result release: After a 1-month evaluation period, the evaluation results and annotated test data were sent to each participant group.</p>
      </sec>
      <sec>
        <title>Systems</title>
        <sec>
          <title>Baseline Systems</title>
          <p>As a baseline, 2 systems were constructed using a support vector machine (SVM) based on unigram and bigram features. For feature representation, the bag-of-words model was used in each system. A tweet message was segmented using MeCab, created by Kudo et al [<xref ref-type="bibr" rid="ref47">47</xref>] for Japanese messages, natural language toolkit (NLTK) TweetTokenizer, created by Bird [<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref49">49</xref>] for English messages, and jieba, created by Junyi [<xref ref-type="bibr" rid="ref50">50</xref>] for Chinese messages. The 2 systems had a linear kernel, and the parameter for regularization, <italic>C</italic>, was set to 1. The baseline systems were implemented using scikit-learn (sklearn) [<xref ref-type="bibr" rid="ref51">51</xref>,<xref ref-type="bibr" rid="ref52">52</xref>].</p>
        </sec>
        <sec>
          <title>Participating Systems</title>
          <p>In all, 37 systems (of 9 groups) participated and had their results submitted in the MedWeb. Of these, 19 systems (of 8 groups) submitted results for the Japanese subtask, 12 systems (of 4 groups) for the English subtask, and 6 systems (of 2 groups) for the Chinese subtask. The participating systems for the Japanese, English, and Chinese subtasks are summarized in <xref ref-type="table" rid="table4">Table 4</xref>.</p>
            <table-wrap position="float" id="table3">
              <label>Table 3</label>
              <caption>
                <p>Exceptions for symptom labels.</p>
              </caption>
              <table width="100%" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
                <col width="46*"/>
                <col width="51*"/>
                <col width="54*"/>
                <col width="56*"/>
                <col width="49*"/>
                <thead>
                  <tr valign="top">
                    <td rowspan="2">Symptom</td>
                    <td rowspan="2">Expressions with suspicion</td>
                    <td rowspan="2">Just a symptom word</td>
                    <td colspan="2">Exceptions</td>
                  </tr>
                  <tr valign="top">
                    <td>Regarded as symptom</td>
                    <td>Not regarded as symptom</td>
                  </tr>
                </thead>
                <tbody>
                  <tr valign="top">
                    <td>Cold</td>
                    <td>Accept</td>
                    <td>Accept</td>
                    <td>—<sup>a</sup></td>
                    <td>—</td>
                  </tr>
                  <tr valign="top">
                    <td>Cough</td>
                    <td>Accept</td>
                    <td>Accept</td>
                    <td>Alcohol drinking and pungently flavored food</td>
                    <td>—</td>
                  </tr>
                  <tr valign="top">
                    <td>Diarrhea</td>
                    <td>Accept</td>
                    <td>Accept</td>
                    <td>Overeating, indigestion, alcohol drinking, medication, and pungently flavored food</td>
                    <td>—</td>
                  </tr>
                  <tr valign="top">
                    <td>Fever</td>
                    <td>Accept</td>
                    <td>Only <italic>slight fever</italic></td>
                    <td>Hay fever and side effect due to any injection</td>
                    <td>—</td>
                  </tr>
                  <tr valign="top">
                    <td>Hay fever</td>
                    <td>Accept</td>
                    <td>Accept</td>
                    <td>—</td>
                    <td>—</td>
                  </tr>
                  <tr valign="top">
                    <td>Headache</td>
                    <td>Accept</td>
                    <td>Accept</td>
                    <td>—</td>
                    <td>Due to a sense of sight or smell</td>
                  </tr>
                  <tr valign="top">
                    <td>Flu</td>
                    <td>Not accept</td>
                    <td>Not accept</td>
                    <td>—</td>
                    <td>—</td>
                  </tr>
                  <tr valign="top">
                    <td>Runny nose</td>
                    <td>Accept</td>
                    <td>Not accept</td>
                    <td>Hay fever</td>
                    <td>Change in temperature</td>
                  </tr>
                </tbody>
              </table>
              <table-wrap-foot>
                <fn id="table3fn1">
                  <p><sup>a</sup>Indicates there are no exceptions.</p>
                </fn>
              </table-wrap-foot>
            </table-wrap>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Participating systems in subtasks. A total of 19 participating systems and 2 baseline systems are constructed for the Japanese subtask, 12 participating systems and 2 baseline systems are constructed for the English subtask, and 6 participating systems and 2 baseline systems are constructed for the Chinese subtask.</p>
          </caption>
          <table width="100%" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="40*"/>
            <col width="115*"/>
            <col width="101*"/>
            <thead>
              <tr valign="top">
                <td>System ID</td>
                <td>Models or methods</td>
                <td>Language resources</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>AITOK-ja [<xref ref-type="bibr" rid="ref33">33</xref>]</td>
                <td>Keyword-based, logistic regression, and SVM<sup>a,b</sup></td>
                <td>—<sup>c</sup></td>
              </tr>
              <tr valign="top">
                <td>AKBL-ja and AKBL-en [<xref ref-type="bibr" rid="ref34">34</xref>]</td>
                <td>SVM and Fisher exact test</td>
                <td>Patient symptom feature word dictionary and Disease-X feature words dict1 and dict2</td>
              </tr>
              <tr valign="top">
                <td>DrG-ja [<xref ref-type="bibr" rid="ref35">35</xref>]</td>
                <td>Random forest</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>KIS-ja [<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                <td>Rule-based and SVM</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>NAIST-ja, NAIST-en, and NAIST-zh [<xref ref-type="bibr" rid="ref37">37</xref>]</td>
                <td>Ensembles of hierarchical attention network and deep character-level convolutional neural network with loss functions (negative loss function, hinge, and hinge squared)</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>NIL-ja [<xref ref-type="bibr" rid="ref38">38</xref>]</td>
                <td>Rule-based</td>
                <td>—</td>
              </tr>
              <tr valign="top">
                <td>NTTMU-ja [<xref ref-type="bibr" rid="ref39">39</xref>]</td>
                <td>Principle-based approach</td>
                <td>Manually constructed knowledge for capturing tweets that conveyed flu-related information, using common sense and ICD-10<sup>d</sup></td>
              </tr>
              <tr valign="top">
                <td>NTTMU-en [<xref ref-type="bibr" rid="ref39">39</xref>]</td>
                <td>SVM and recurrent neural network</td>
                <td>Manually constructed knowledge for capturing tweets that conveyed flu-related information, using common sense and ICD-10</td>
              </tr>
              <tr valign="top">
                <td>TUA1-zh [<xref ref-type="bibr" rid="ref40">40</xref>]</td>
                <td>Logistic regression, SVM, and logistic regression with semantic information</td>
                <td>Updated training samples using active learning unlabeled posts downloaded with the symptom names in Chinese</td>
              </tr>
              <tr valign="top">
                <td>UE-ja [<xref ref-type="bibr" rid="ref41">41</xref>]</td>
                <td>Rule-based and random forest</td>
                <td>Custom dictionary consisting of nouns selected from the dry-run dataset and heuristics</td>
              </tr>
              <tr valign="top">
                <td>UE-en [<xref ref-type="bibr" rid="ref41">41</xref>]</td>
                <td>Rule-based, random forests, and skip-gram neural network for word2vec</td>
                <td>Custom dictionary consisting of nouns selected from the dry-run dataset and heuristics</td>
              </tr>
              <tr valign="top">
                <td>Baseline</td>
                <td>SVM (unigram and bigram)</td>
                <td>—</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup>SVM: support vector machine.</p>
            </fn>
            <fn id="table4fn2">
              <p><sup>b</sup>It indicates that the method was tested after the submission of the formal run, and thus, it was not included in the results.</p>
            </fn>
            <fn id="table4fn3">
              <p><sup>c</sup>It indicates that any language resources were not used.</p>
            </fn>
            <fn id="table4fn4">
              <p><sup>d</sup>ICD: International Codes for Diseases.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
          <p>As for the Japanese subtask, most of the groups applied machine learning approaches, such as SVM (as in the baseline systems), random forests, and neural networks. Several groups constructed their own resources to enhance the original training corpus. Similarly, for the English subtask, most of the groups applied machine learning approaches, such as SVM, random forests, and neural networks. The Chinese subtask had 2 participating groups: one applied the same methods as the other subtasks and the other used logistic regression and SVM and updated the training data using active learning.</p>
        </sec>
      </sec>
      <sec>
        <title>Evaluation Metrics</title>
        <p>The performance in the subtasks was assessed using the exact match accuracy, F-measure (beta=1) (<italic>F1</italic>) based on precision and recall, and Hamming loss [<xref ref-type="bibr" rid="ref53">53</xref>].</p>
        <p>The details of the metrics are as follows.</p>
        <list list-type="bullet">
          <list-item>
            <p>Exact match accuracy: If <italic>y’</italic><sup><italic>(i)</italic> </sup> indicates the predicted symptom label values of the <italic>i</italic>-th tweet and <italic>y</italic><sup><italic>(i)</italic> </sup> is the corresponding true labels, then the fraction of correct predictions over the test data corpus (<italic>N</italic>=640) is calculated as follows: <italic>accuracy(y, y’)=1/N</italic> <italic>∙∑</italic><sup><italic>N</italic> </sup><sub><italic>i=1</italic> </sub><italic>1(</italic> <italic>y’</italic><sup><italic>(i)</italic> </sup><italic>=y</italic><sup><italic>(i)</italic> </sup><italic>),</italic> where <italic>1(.)</italic> is the indicator function, which returns 1 if the entire set of predicted labels for a tweet strictly matches with the true set of labels.</p>
          </list-item>
          <list-item>
            <p>Precision (micro or macro): It is defined as the number of true positives (<italic>T</italic><sub><italic>p</italic> </sub>) over the sum of the number of true positive and false positives (<italic>F</italic><sub><italic>p</italic> </sub>): <italic>precision=T</italic><sub><italic>p</italic> </sub><italic>/(T</italic><sub><italic>p</italic> </sub><italic>+F</italic><sub><italic>p</italic> </sub><italic>)</italic>.</p>
          </list-item>
          <list-item>
            <p>Recall (micro or macro): It is defined as the number of true positives (<italic>T</italic><sub><italic>p</italic> </sub>) over the sum of the number of true positive and false negatives (<italic>F</italic><sub><italic>n</italic> </sub>): <italic>recall=T</italic><sub><italic>p</italic> </sub><italic>/(T</italic><sub><italic>p</italic> </sub><italic>+F</italic><sub><italic>n</italic> </sub><italic>)</italic>.</p>
          </list-item>
          <list-item>
            <p>F1 (micro or macro): The harmonic mean of precision and recall is calculated as follows: <italic>F1=2∙precision∙recall/(precision+recall).</italic></p>
          </list-item>
          <list-item>
            <p>Hamming loss: It computes the average Hamming loss between two sets of labels. If <italic>y’</italic><sup><italic>(i)</italic> </sup> is the predicted value for the <italic>j</italic>-th label of the <italic>i</italic>-th tweet, <italic>y</italic><sup><italic>(i)</italic> </sup><sub><italic>j</italic> </sub> is the corresponding true value, <italic>N</italic> is the number of test data (<italic>N</italic>=640), and <italic>L</italic> is the number of labels (<italic>L</italic>=8), then the Hamming loss between the predicted and correct labels is calculated as follows: <italic>L</italic><sub><italic>Hamming</italic> </sub><italic>(y,y’)=1/N</italic> <italic>∙1/L∙∑</italic><sup><italic>N</italic> </sup><sub><italic>i=1</italic> </sub><italic>∑</italic><sup><italic>L</italic> </sup><sub><italic>j=1</italic></sub><italic>1(</italic><italic>y’</italic><sup><italic>(i)</italic> </sup><sub><italic>j</italic> </sub><italic>≠y</italic><sup><italic>(i)</italic> </sup><sub><italic>j</italic> </sub><italic>),</italic> where <italic>1(.)</italic> is the indicator function. Note that lower scores are better.</p>
          </list-item>
        </list>
        <p>Note that <italic>micro</italic> is to calculate metrics globally by counting all true positives, false negatives, and false positives: <italic>F1micro=2∙precisionmicro∙recallmicro/(precisionmicro+recallmicro)</italic>.</p>
        <p>On the other hand, <italic>macro</italic> calculates the metrics for each symptom label and then determines their unweighted mean: <italic>F1macro=1/L∙∑</italic><sup><italic>L</italic> </sup><sub><italic>j=1</italic> </sub><italic>F1</italic><sub><italic>j</italic> </sub><italic>.</italic> Therefore, label imbalance is not taken into account.</p>
      </sec>
      <sec>
        <title>Ethics Statement</title>
        <p>This study did not require the participants to be involved in any physical and/or mental intervention. As this research did not use personally identifiable information, it was exempted from the institutional review board approval in accordance with the Ethical Guidelines for Medical and Health Research Involving Human Subjects stipulated by the Japanese national government.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Symptom Labeling Reliability</title>
        <p>To show the reliability of symptom labeling to the corpus, the interannotation agreement ratios of the respective symptoms were measured (<xref ref-type="table" rid="table5">Table 5</xref>). The total interannotator agreement ratio (n=2) was 0.9851 (ie, 20,174 / [2560 × 8]).</p>
      </sec>
      <sec>
        <title>Performance of Baseline Systems</title>
        <p>The performance of the baseline was measured using all evaluation metrics. <xref ref-type="table" rid="table6">Tables 6</xref>-<xref ref-type="table" rid="table8">8</xref> show the results for the Japanese, English, and Chinese subtasks, respectively.</p>
        <p>For the Japanese and Chinese subtasks, unigram SVM performed better than bigram SVM. On the other hand, bigram SVM outperformed unigram SVM in the English subtask. The highest average of exact match accuracy was 0.791 (English subtask) and the lowest was 0.756 (Japanese subtask).</p>
      </sec>
      <sec>
        <title>Performance of Participating Systems</title>
        <p>The performance of the participating systems was also measured using all evaluation metrics. <xref ref-type="table" rid="table6">Tables 6</xref>-<xref ref-type="table" rid="table8">8</xref> show the results for the Japanese, English, and Chinese subtasks, respectively, ordered by the exact match accuracy of the systems.</p>
        <p>For the Japanese subtask, the best system, NAIST-ja-2, achieved 0.880 in exact match accuracy, 0.920 in F-measure, and 0.019 in Hamming loss, as shown in <xref ref-type="table" rid="table6">Table 6</xref>. The averages across the participating groups and the baseline systems were 0.720, 0.820, and 0.051, respectively. The rank order of the top 4 systems was the same in all measures. The systems of the AKBL and KIS groups were constructed using an SVM, as in the baseline systems. The AKBL group’s results indicated that their system was effective in terms of using additional language resources. The KIS group switched their methods between an SVM and a rule-based method, depending on the confidence factor.</p>
        <p>For the English subtask, the best system, NAIST-en-2, achieved 0.880 in exact match accuracy, 0.920 in F-measure, and 0.019 in Hamming loss, as shown in <xref ref-type="table" rid="table7">Table 7</xref>. The system was constructed using the same method as that used in the Japanese subtask. The averages across the participating groups and the baseline systems were 0.770, 0.850, and 0.037, respectively.</p>
        <p>For the Chinese subtask, the best system, NAIST-zh-2, achieved 0.880 in exact match accuracy, 0.920 in F-measure, and 0.019 in Hamming loss, as shown in <xref ref-type="table" rid="table8">Table 8</xref>. The system was constructed using the same method as that used in the Japanese and English subtasks. The averages across the participating groups and the baseline systems were 0.810, 0.880, and 0.032, respectively.</p>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Interannotator agreement ratio.</p>
          </caption>
          <table width="100%" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="102*"/>
            <col width="154*"/>
            <thead>
              <tr valign="top">
                <td>Symptom</td>
                <td>Agreement ratio (number)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Cold</td>
                <td>0.9945 (2546/2560)</td>
              </tr>
              <tr valign="top">
                <td>Cough</td>
                <td>0.9934 (2543/2560)</td>
              </tr>
              <tr valign="top">
                <td>Diarrhea</td>
                <td>0.9785 (2505/2560)</td>
              </tr>
              <tr valign="top">
                <td>Fever</td>
                <td>0.9922 (2540/2560)</td>
              </tr>
              <tr valign="top">
                <td>Hay fever</td>
                <td>0.9918 (2539/2560)</td>
              </tr>
              <tr valign="top">
                <td>Headache</td>
                <td>0.9773 (2502/2560)</td>
              </tr>
              <tr valign="top">
                <td>Flu</td>
                <td>0.9734 (2492/2560)</td>
              </tr>
              <tr valign="top">
                <td>Runny nose</td>
                <td>0.9793 (2507/2560)</td>
              </tr>
              <tr valign="top">
                <td>Total</td>
                <td>0.9851 (20,174/20,480)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <table-wrap position="float" id="table6">
          <label>Table 6</label>
          <caption>
            <p>Performance in the Japanese subtask (19 participating systems and 2 baseline systems).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="150"/>
            <col width="150"/>
            <col width="80"/>
            <col width="100"/>
            <col width="100"/>
            <col width="70"/>
            <col width="100"/>
            <col width="100"/>
            <col width="150"/>
            <thead>
              <tr valign="top">
                <td rowspan="2">System ID<sup>a</sup></td>
                <td rowspan="2">Exact match<sup>b</sup></td>
                <td colspan="2">F1</td>
                <td colspan="2">Precision</td>
                <td colspan="2">Recall</td>
                <td rowspan="2">Hamming loss</td>
              </tr>
              <tr valign="top">
                <td>Micro</td>
                <td>Macro</td>
                <td>Micro</td>
                <td>Macro</td>
                <td>Micro</td>
                <td>Macro</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>NAIST-ja-2</td>
                <td>0.880</td>
                <td>0.920</td>
                <td>0.906</td>
                <td>0.899</td>
                <td>0.887</td>
                <td>0.941</td>
                <td>0.925</td>
                <td>0.019</td>
              </tr>
              <tr valign="top">
                <td>NAIST-ja-3</td>
                <td>0.878</td>
                <td>0.919</td>
                <td>0.904</td>
                <td>0.899</td>
                <td>0.885</td>
                <td>0.940</td>
                <td>0.924</td>
                <td>0.019</td>
              </tr>
              <tr valign="top">
                <td>NAIST-ja-1</td>
                <td>0.877</td>
                <td>0.918</td>
                <td>0.904</td>
                <td>0.899</td>
                <td>0.887</td>
                <td>0.938</td>
                <td>0.921</td>
                <td>0.020</td>
              </tr>
              <tr valign="top">
                <td>AKBL-ja-3</td>
                <td>0.805</td>
                <td>0.872</td>
                <td>0.859</td>
                <td>0.896</td>
                <td>0.883</td>
                <td>0.849</td>
                <td>0.839</td>
                <td>0.029</td>
              </tr>
              <tr valign="top">
                <td>UE-ja-1</td>
                <td>0.805</td>
                <td>0.865</td>
                <td>0.855</td>
                <td>0.831</td>
                <td>0.819</td>
                <td>0.903</td>
                <td>0.902</td>
                <td>0.033</td>
              </tr>
              <tr valign="top">
                <td>KIS-ja-2</td>
                <td>0.802</td>
                <td>0.871</td>
                <td>0.856</td>
                <td>0.831</td>
                <td>0.815</td>
                <td>0.915</td>
                <td>0.904</td>
                <td>0.032</td>
              </tr>
              <tr valign="top">
                <td>AKBL-ja-1</td>
                <td>0.800</td>
                <td>0.869</td>
                <td>0.847</td>
                <td>0.889</td>
                <td>0.873</td>
                <td>0.849</td>
                <td>0.825</td>
                <td>0.030</td>
              </tr>
              <tr valign="top">
                <td>UE-ja-3</td>
                <td>0.800</td>
                <td>0.866</td>
                <td>0.855</td>
                <td>0.823</td>
                <td>0.812</td>
                <td>0.913</td>
                <td>0.911</td>
                <td>0.033</td>
              </tr>
              <tr valign="top">
                <td>AKBL-ja-2</td>
                <td>0.795</td>
                <td>0.868</td>
                <td>0.849</td>
                <td>0.891</td>
                <td>0.875</td>
                <td>0.846</td>
                <td>0.827</td>
                <td>0.030</td>
              </tr>
              <tr valign="top">
                <td>KIS-ja-3</td>
                <td>0.784</td>
                <td>0.855</td>
                <td>0.831</td>
                <td>0.840</td>
                <td>0.816</td>
                <td>0.871</td>
                <td>0.850</td>
                <td>0.034</td>
              </tr>
              <tr valign="top">
                <td>SVM-unigram</td>
                <td>0.761</td>
                <td>0.849</td>
                <td>0.835</td>
                <td>0.843</td>
                <td>0.828</td>
                <td>0.854</td>
                <td>0.842</td>
                <td>0.036</td>
              </tr>
              <tr valign="top">
                <td>KIS-ja-1</td>
                <td>0.758</td>
                <td>0.849</td>
                <td>0.833</td>
                <td>0.798</td>
                <td>0.782</td>
                <td>0.906</td>
                <td>0.899</td>
                <td>0.038</td>
              </tr>
              <tr valign="top">
                <td>SVM-bigram</td>
                <td>0.752</td>
                <td>0.843</td>
                <td>0.830</td>
                <td>0.838</td>
                <td>0.820</td>
                <td>0.848</td>
                <td>0.845</td>
                <td>0.037</td>
              </tr>
              <tr valign="top">
                <td>NTTMU-ja-1</td>
                <td>0.738</td>
                <td>0.835</td>
                <td>0.829</td>
                <td>0.770</td>
                <td>0.761</td>
                <td>0.913</td>
                <td>0.921</td>
                <td>0.042</td>
              </tr>
              <tr valign="top">
                <td>UE-ja-2</td>
                <td>0.706</td>
                <td>0.815</td>
                <td>0.803</td>
                <td>0.696</td>
                <td>0.702</td>
                <td>0.983</td>
                <td>0.984</td>
                <td>0.052</td>
              </tr>
              <tr valign="top">
                <td>NIL-ja-1</td>
                <td>0.680</td>
                <td>0.749</td>
                <td>0.742</td>
                <td>0.862</td>
                <td>0.845</td>
                <td>0.662</td>
                <td>0.671</td>
                <td>0.052</td>
              </tr>
              <tr valign="top">
                <td>DrG-ja-1</td>
                <td>0.653</td>
                <td>0.777</td>
                <td>0.774</td>
                <td>0.825</td>
                <td>0.808</td>
                <td>0.734</td>
                <td>0.779</td>
                <td>0.049</td>
              </tr>
              <tr valign="top">
                <td>NTTMU-ja-3</td>
                <td>0.614</td>
                <td>0.775</td>
                <td>0.773</td>
                <td>0.740</td>
                <td>0.720</td>
                <td>0.814</td>
                <td>0.840</td>
                <td>0.055</td>
              </tr>
              <tr valign="top">
                <td>NTTMU-ja-2</td>
                <td>0.597</td>
                <td>0.770</td>
                <td>0.753</td>
                <td>0.741</td>
                <td>0.706</td>
                <td>0.801</td>
                <td>0.813</td>
                <td>0.056</td>
              </tr>
              <tr valign="top">
                <td>AITOK-ja-2</td>
                <td>0.503</td>
                <td>0.706</td>
                <td>0.696</td>
                <td>0.726</td>
                <td>0.738</td>
                <td>0.687</td>
                <td>0.767</td>
                <td>0.067</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table6fn1">
              <p><sup>a</sup>The system ID comprises the group ID (see <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>), the abbreviation of subtask (ja indicates Japanese subtask), and the system number from 1 to 3 since each group can submit three systems per subtask.</p>
            </fn>
            <fn id="table6fn2">
              <p><sup>b</sup>The results are ordered by exact match accuracy.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table7">
          <label>Table 7</label>
          <caption>
            <p>Performance in the English subtask (12 participating systems and 2 baseline systems).</p>
          </caption>
          <table width="1000" cellpadding="7" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="150"/>
            <col width="150"/>
            <col width="80"/>
            <col width="100"/>
            <col width="100"/>
            <col width="80"/>
            <col width="90"/>
            <col width="100"/>
            <col width="150"/>
            <thead>
              <tr valign="top">
                <td rowspan="2">System ID<sup>a</sup></td>
                <td rowspan="2">Exact match<sup>b</sup></td>
                <td colspan="2">F1</td>
                <td colspan="2">Precision</td>
                <td colspan="2">Recall</td>
                <td rowspan="2">Hamming loss</td>
              </tr>
              <tr valign="top">
                <td>Micro</td>
                <td>Macro</td>
                <td>Micro</td>
                <td>Macro</td>
                <td>Micro</td>
                <td>Macro</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>NAIST-en-2</td>
                <td>0.880</td>
                <td>0.920</td>
                <td>0.906</td>
                <td>0.899</td>
                <td>0.887</td>
                <td>0.941</td>
                <td>0.925</td>
                <td>0.019</td>
              </tr>
              <tr valign="top">
                <td>NAIST-en-3</td>
                <td>0.878</td>
                <td>0.919</td>
                <td>0.904</td>
                <td>0.899</td>
                <td>0.885</td>
                <td>0.940</td>
                <td>0.924</td>
                <td>0.019</td>
              </tr>
              <tr valign="top">
                <td>NAIST-en-1</td>
                <td>0.877</td>
                <td>0.918</td>
                <td>0.904</td>
                <td>0.899</td>
                <td>0.887</td>
                <td>0.938</td>
                <td>0.921</td>
                <td>0.020</td>
              </tr>
              <tr valign="top">
                <td>SVM-bigram</td>
                <td>0.800</td>
                <td>0.866</td>
                <td>0.856</td>
                <td>0.865</td>
                <td>0.849</td>
                <td>0.868</td>
                <td>0.865</td>
                <td>0.031</td>
              </tr>
              <tr valign="top">
                <td>UE-en-1</td>
                <td>0.789</td>
                <td>0.858</td>
                <td>0.848</td>
                <td>0.846</td>
                <td>0.831</td>
                <td>0.871</td>
                <td>0.876</td>
                <td>0.034</td>
              </tr>
              <tr valign="top">
                <td>SVM-unigram</td>
                <td>0.783</td>
                <td>0.858</td>
                <td>0.845</td>
                <td>0.851</td>
                <td>0.830</td>
                <td>0.864</td>
                <td>0.864</td>
                <td>0.033</td>
              </tr>
              <tr valign="top">
                <td>NTTMU-en-2</td>
                <td>0.773</td>
                <td>0.856</td>
                <td>0.849</td>
                <td>0.807</td>
                <td>0.796</td>
                <td>0.911</td>
                <td>0.918</td>
                <td>0.036</td>
              </tr>
              <tr valign="top">
                <td>NTTMU-en-3</td>
                <td>0.758</td>
                <td>0.845</td>
                <td>0.828</td>
                <td>0.836</td>
                <td>0.818</td>
                <td>0.854</td>
                <td>0.844</td>
                <td>0.037</td>
              </tr>
              <tr valign="top">
                <td>UE-en-2</td>
                <td>0.745</td>
                <td>0.821</td>
                <td>0.809</td>
                <td>0.861</td>
                <td>0.838</td>
                <td>0.786</td>
                <td>0.800</td>
                <td>0.040</td>
              </tr>
              <tr valign="top">
                <td>UE-en-3</td>
                <td>0.739</td>
                <td>0.820</td>
                <td>0.815</td>
                <td>0.870</td>
                <td>0.851</td>
                <td>0.776</td>
                <td>0.795</td>
                <td>0.040</td>
              </tr>
              <tr valign="top">
                <td>AKBL-en-2</td>
                <td>0.734</td>
                <td>0.819</td>
                <td>0.799</td>
                <td>0.832</td>
                <td>0.808</td>
                <td>0.806</td>
                <td>0.793</td>
                <td>0.042</td>
              </tr>
              <tr valign="top">
                <td>AKBL-en-3</td>
                <td>0.716</td>
                <td>0.804</td>
                <td>0.787</td>
                <td>0.853</td>
                <td>0.834</td>
                <td>0.760</td>
                <td>0.747</td>
                <td>0.043</td>
              </tr>
              <tr valign="top">
                <td>NTTMU-en-1</td>
                <td>0.619</td>
                <td>0.770</td>
                <td>0.777</td>
                <td>0.734</td>
                <td>0.733</td>
                <td>0.809</td>
                <td>0.835</td>
                <td>0.056</td>
              </tr>
              <tr valign="top">
                <td>AKBL-en-1</td>
                <td>0.613</td>
                <td>0.772</td>
                <td>0.755</td>
                <td>0.656</td>
                <td>0.649</td>
                <td>0.936</td>
                <td>0.945</td>
                <td>0.065</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table7fn1">
              <p><sup>a</sup>The system ID comprises the group ID (see <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>), the abbreviation of subtask (en indicates English subtask), and the system number from 1 to 3 since each group can submit three systems per subtask.</p>
            </fn>
            <fn id="table7fn2">
              <p><sup>b</sup>The results are ordered by exact match accuracy.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table8">
          <label>Table 8</label>
          <caption>
            <p>Performance in the Chinese subtask (6 participating systems and 2 baseline systems).</p>
          </caption>
          <table width="100%" cellpadding="7" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="41*"/>
            <col width="36*"/>
            <col width="21*"/>
            <col width="22*"/>
            <col width="25*"/>
            <col width="22*"/>
            <col width="22*"/>
            <col width="29*"/>
            <col width="39*"/>
            <thead>
              <tr valign="top">
                <td rowspan="2">System ID<sup>a</sup></td>
                <td rowspan="2">Exact match<sup>b</sup></td>
                <td colspan="2">F1</td>
                <td colspan="2">Precision</td>
                <td colspan="2">Recall</td>
                <td rowspan="2">Hamming loss</td>
              </tr>
              <tr valign="top">
                <td>Micro</td>
                <td>Macro</td>
                <td>Micro</td>
                <td>Macro</td>
                <td>Micro</td>
                <td>Macro</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>NAIST-zh-2</td>
                <td>0.880</td>
                <td>0.920</td>
                <td>0.906</td>
                <td>0.899</td>
                <td>0.887</td>
                <td>0.941</td>
                <td>0.925</td>
                <td>0.019</td>
              </tr>
              <tr valign="top">
                <td>NAIST-zh-3</td>
                <td>0.878</td>
                <td>0.919</td>
                <td>0.904</td>
                <td>0.899</td>
                <td>0.885</td>
                <td>0.940</td>
                <td>0.924</td>
                <td>0.019</td>
              </tr>
              <tr valign="top">
                <td>NAIST-zh-1</td>
                <td>0.877</td>
                <td>0.918</td>
                <td>0.904</td>
                <td>0.899</td>
                <td>0.887</td>
                <td>0.938</td>
                <td>0.921</td>
                <td>0.020</td>
              </tr>
              <tr valign="top">
                <td>TUA1-zh-3</td>
                <td>0.786</td>
                <td>0.860</td>
                <td>0.844</td>
                <td>0.772</td>
                <td>0.760</td>
                <td>0.970</td>
                <td>0.971</td>
                <td>0.037</td>
              </tr>
              <tr valign="top">
                <td>SVM-unigram</td>
                <td>0.780</td>
                <td>0.858</td>
                <td>0.843</td>
                <td>0.831</td>
                <td>0.815</td>
                <td>0.888</td>
                <td>0.883</td>
                <td>0.034</td>
              </tr>
              <tr valign="top">
                <td>TUA1-zh-1</td>
                <td>0.773</td>
                <td>0.853</td>
                <td>0.838</td>
                <td>0.766</td>
                <td>0.753</td>
                <td>0.963</td>
                <td>0.965</td>
                <td>0.039</td>
              </tr>
              <tr valign="top">
                <td>SVM-bigram</td>
                <td>0.767</td>
                <td>0.850</td>
                <td>0.835</td>
                <td>0.824</td>
                <td>0.806</td>
                <td>0.878</td>
                <td>0.876</td>
                <td>0.036</td>
              </tr>
              <tr valign="top">
                <td>TUA1-zh-2</td>
                <td>0.719</td>
                <td>0.824</td>
                <td>0.809</td>
                <td>0.712</td>
                <td>0.710</td>
                <td>0.978</td>
                <td>0.982</td>
                <td>0.049</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table8fn1">
              <p><sup>a</sup>The system ID comprises the group ID (see <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>), the abbreviation of subtask (zh indicates Chinese subtask), and the system number from 1 to 3 since each group can submit 3 systems per subtask.</p>
            </fn>
            <fn id="table8fn2">
              <p><sup>b</sup> The results are ordered by exact match accuracy.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>One of the most valuable findings was that we could determine the best strategy for disease surveillance. The best system of the NAIST group had 2 characteristics: (1) cross-language features and (2) ensemble of multiple machine learning methods.</p>
        <sec>
          <title>Cross-Language Features</title>
          <p>For each language, the NAIST system utilized features from the other 2 languages. English and Chinese sentences were translated from a Japanese sentence, indicating that these 3 sentences shared the same symptom label set. Only the NAIST system focused on the property of this task’s corpus and improved the accuracy from 0.767 to 0.823 in exact match.</p>
        </sec>
        <sec>
          <title>Ensemble Methods</title>
          <p>The NAIST system also utilized an ensemble method, which combines multiple methods to boost the classification accuracy. Although weak machine learning algorithms tend to be generally preferred to make an ensemble, the NAIST group created an ensemble consisting of strong machine learning methods: a hierarchical attention network and a deep convolutional neural network (CNN). The combination of methods varied the exact match accuracy of 0.836 at the minimum to 0.880 at the maximum. In the near future, a technique to find a better combination needs to be developed.</p>
          <p>Out of the 2 features, the cross-language feature is the unique feature of this task. Even if we discounted the cross-language feature, the NAIST ensemble method exhibited the best performance. As the multi-label classification is known as a complex task, the performance of straightforward approaches relying only on 1 method was relatively lower than that of the NAIST system.</p>
          <p>Note that previous NTCIR medical tasks and MedNLP workshops [<xref ref-type="bibr" rid="ref13">13</xref>-<xref ref-type="bibr" rid="ref15">15</xref>] have shown that a rule-based approach is still competitive with machine learning approaches. One of the reasons for this was the small size of the corpus they used. Although the corpus size was also limited in this task, this result showed the advantage of complex machine learning, indicating the advancement of machine learning techniques.</p>
        </sec>
      </sec>
      <sec>
        <title>Subtask-Based Comparison</title>
        <p>The MedWeb task provided a cross-language corpus. Although this is another characteristic of this task, only 1 group (NAIST) challenged all subtasks, which was lesser than our expectation. The Japanese subtask had the highest participation (19 systems from 8 groups), whereas the Chinese subtask had the lowest participation (6 systems from only 2 groups), which was also lower than our expectation.</p>
        <p>The performance varied depending on the subtasks. <xref ref-type="fig" rid="figure1">Figure 1</xref> shows the distribution of the 3 metric scores of the systems in each subtask. For the Japanese subtask, the performance varied widely, relative to that of the other subtasks. Although the Chinese subtask had the lowest participation, their performance was relatively high. The 4 groups that participated in the Japanese subtask also challenged the English subtask, with better results, on average, in the English subtask. This indicates that the difficulty of classification in increasing order is Chinese, English, and Japanese. This is a surprising result because most of the groups came from Japan and must have been familiar with the Japanese NLP.</p>
        <p>This indicates that the Chinese language has less ambiguity in clinical factuality analyses. Another possibility is that the process we used to generate the corpora had a language bias. For example, the translations from Japanese to English and Chinese might have reduced the ambiguity of the language in each case. To test for language bias, experiments based on different directions of translation are necessary. This is left for future work. Note that the baseline systems performed the best in the English subtask, indicating that the standard settings for SVM are effective in terms of classifying English tweets.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>The corpora provided by the MedWeb task have the following limitations. The first is the generating process of the corpora. For example, our pseudotweets do not include several tweet-specific features such as reply, retweet, hashtag, and URL. In addition, the translation process might bias the results. Although we asked translators to translate Japanese short messages without following standard English or Chinese as they could, some of them would be more formal than tweets.</p>
        <p>Another limitation is the size of each corpus (1920 messages are used as training data and 640 messages are used as test data). Regardless of these limitations, we believe that this is a valuable attempt to generate and share a cross-language corpus consisting of multi-label pseudotweets.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Statistical summary of the performance of 3 evaluation metrics (A: Exact math accuracy, B: F1-micro, and C: Hamming loss) in each of the subtasks (ja: Japanese, en: English, and zh: Chinese). Note that higher scores are better in exact match accuracy and F1-micro, whereas lower scores are better in hamming loss. The bottom and top of a box are the first and third quartiles, the band inside the box is the median, and the dotted band inside the box is the mean. Dots on the right side of the box represent the distribution of values of participating systems.</p>
          </caption>
          <graphic xlink:href="jmir_v21i2e12783_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>Although our corpus has some limitations, we still believe it is helpful as a benchmark for tweet-based applications, because it is freely available and covers multiple languages.</p>
      </sec>
      <sec>
        <title>Comparison With Prior Work</title>
        <p>Currently, several shared tasks related to medical or health care have already been held. In the United States, the i2b2 tasks [<xref ref-type="bibr" rid="ref3">3</xref>] were organized by the National Institute of Health [<xref ref-type="bibr" rid="ref54">54</xref>] to enhance the ability of NLP tools to extract fine-grained information from clinical records. Specifically, i2b2 has provided sets of fully deidentified notes and proposed several challenges, such as deidentification and heart disease risk factor challenge, temporal relation challenge, conference challenge, relation challenge, medication challenge, obesity challenge, and deidentification and smoking challenge.</p>
        <p>In addition, the TREC Medical Records Track (TREC2011-2012) [<xref ref-type="bibr" rid="ref4">4</xref>] was established for the research community to focus on the problem of providing content-based access to free text fields of electronic health records. Then, Clinical Decision Support/Precision Medicine Tracks (TREC2014-2018) [<xref ref-type="bibr" rid="ref5">5</xref>-<xref ref-type="bibr" rid="ref9">9</xref>] were organized in TREC. The Clinical Decision Support Track focused on the retrieval of biomedical articles relevant for answering generic clinical questions about medical records, and TREC Precision Medicine Track focused on a use case in clinical decision support, providing useful precision medicine-related information to clinicians treating cancer patients.</p>
        <p>Furthermore, the CLEF eHealth [<xref ref-type="bibr" rid="ref10">10</xref>] focused on NLP and information retrieval for clinical care in the European Union. In Japan, NTCIR Medical tasks and MedNLP workshops (MedNLP-1, MedNLP-2, and MedNLP-Doc) [<xref ref-type="bibr" rid="ref11">11</xref>-<xref ref-type="bibr" rid="ref16">16</xref>] were organized to promote and support the generation of practical tools and systems applicable in the medical industry, which will support medical decisions and treatments by physicians and medical staff. MedNLP-1 [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref14">14</xref>] aimed to retrieve important information (personal and medical) from the clinical text written in Japanese. MedNLP-2 [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref15">15</xref>] challenged to extract information from medical reports written by physicians and from past medical exams. MedNLP-Doc [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref16">16</xref>] proposed a task to guess the name of the disease (represented by the International Codes for Diseases [ICD]) from the provided medical records. However, to the best of our knowledge, the MedWeb is the first shared task for dealing with health-related social media data.</p>
        <p>Due to the widespread use of the internet, considerable material concerning medical care or health has been made available on the Web, especially social media such as Twitter and Facebook. Furthermore, various Web mining techniques for utilizing the material have been developed. One of the most popular medical applications is disease surveillance, which aims to predict disease epidemics based on the use of disease-related terms. Particularly, influenza surveillance using social media has been extensively studied [<xref ref-type="bibr" rid="ref17">17</xref>-<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref55">55</xref>]. As most previous studies have relied on shallow textual clues in messages, such as the number of occurrences of specific keywords (eg, <italic>flu</italic> or <italic>influenza</italic>), there are several noisy messages. To filter out noisy tweets, a binary classifier has been employed. In contrast, the MedWeb has challenged a more difficult and practical task of performing a multi-label classification of cross-language user-generated messages.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>This paper provided an overview of the NTCIR-13 MedWeb task, which was designed as a more generalized task for public surveillance, focusing on social media (such as Twitter). In particular, the task’s goal was to classify symptom-related messages. This task had 2 characteristics: (1) multi-label (cold, cough, diarrhea, fever, hay fever, headache, flu, and runny nose) and (2) cross-language (Japanese, English, and Chinese). The results empirically demonstrated that an ensemble of multiple machine learning methods was effective in terms of classification of cross-language messages with multiple labels. We believe that the findings would be a foundation for future and deeper approaches for disease surveillance with social media data.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <app id="app1">
        <title>Multimedia Appendix 1</title>
        <p>Organization of groups participating in MedWeb and statistics of result submissions. Note that it is listed in alphabetical order by Group ID, and ja, en, and zh correspond to Japanese, English, and Chinese subtasks, respectively.</p>
        <media xlink:href="jmir_v21i2e12783_app1.pdf" xlink:title="PDF File (Adobe PDF File), 20KB"/>
      </app>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">CLEF</term>
          <def>
            <p>Cross-Language Evaluation Forum for European Languages</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">CNN</term>
          <def>
            <p>convolutional neural network</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">i2b2</term>
          <def>
            <p>Informatics for Integrating Biology and the Bedside</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">ICD</term>
          <def>
            <p>International Codes for Diseases</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">MedNLP</term>
          <def>
            <p>Medical Natural Language Processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">MedWeb</term>
          <def>
            <p>Medical natural language processing for Web document</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">NTCIR</term>
          <def>
            <p>NII Testbeds and Community for Information access Research</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">SVM</term>
          <def>
            <p>support vector machine</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">TREC</term>
          <def>
            <p>Text Retrieval Conference</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This work was supported by the Japan Agency for Medical Research and Development (Grant Number: JP16768699) and JST ACT-I (JPMJPR16UU). The authors appreciate annotators in Social Computing laboratory at Nara Institute of Science and Technology for their efforts on generating the corpus. The authors also greatly appreciate the NTCIR-13 chairs for their efforts on organizing the NTCIR-13 workshop. Finally, the authors thank all participants for their contributions to the NTCIR-13 MedWeb task.</p>
    </ack>
    <fn-group>
      <fn fn-type="con">
        <p>SW, MM, YK, TO, and EA organized the shared task; SW and EA created the data; SW and EA analyzed the results; and SW, MM, YK, TO, and EA prepared the manuscript.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Boonstra</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Versluis</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Vos</surname>
            <given-names>JF</given-names>
          </name>
        </person-group>
        <article-title>Implementing electronic health records in hospitals: a systematic literature review</article-title>
        <source>BMC Health Serv Res</source>  
        <year>2014</year>  
        <month>09</month>  
        <day>4</day>  
        <volume>14</volume>  
        <fpage>370</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://bmchealthservres.biomedcentral.com/articles/10.1186/1472-6963-14-370"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1186/1472-6963-14-370</pub-id>
        <pub-id pub-id-type="medline">25190184</pub-id>
        <pub-id pub-id-type="pii">1472-6963-14-370</pub-id>
        <pub-id pub-id-type="pmcid">PMC4162964</pub-id></nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Hsiao</surname>
            <given-names>CJ</given-names>
          </name>
          <name name-style="western">
            <surname>Hing</surname>
            <given-names>E</given-names>
          </name>
        </person-group>
        <article-title>Use and characteristics of electronic health record systems among office-based physician practices: United States, 2001-2012</article-title>
        <source>NCHS Data Brief</source>  
        <year>2012</year>  
        <month>12</month>  
        <issue>111</issue>  
        <fpage>1</fpage>  
        <lpage>8</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cdc.gov/nchs/data/databriefs/db111.pdf"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1097/01.sa.0000451505.72517.a5</pub-id>
        <pub-id pub-id-type="medline">23384787</pub-id></nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="web">
        <source>i2b2: Informatics for Integrating Biology &amp; the Bedside</source>  
        <access-date>2019-01-20</access-date>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://www.i2b2.org/index.html">https://www.i2b2.org/index.html</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="75a8EIuUR"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Voorhees</surname>
            <given-names>EM</given-names>
          </name>
          <name name-style="western">
            <surname>Hersh</surname>
            <given-names>W</given-names>
          </name>
        </person-group>
        <source>National Institute of Standards and Technology</source>  
        <year>2013</year>  
        <month>06</month>  
        <day>28</day>  
        <access-date>2019-01-22</access-date>
        <comment>Overview of the TREC 2012 Medical Records Track 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://ws680.nist.gov/publication/get_pdf.cfm?pub_id=913781">https://ws680.nist.gov/publication/get_pdf.cfm?pub_id=913781</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="75cJJI0KS"/></comment> </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="web">
        <source>TREC Precision Medicine / Clinical Decision Support Track</source>  
        <access-date>2019-01-21</access-date>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.trec-cds.org/">http://www.trec-cds.org/</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="75aKpBWwa"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
        <name name-style="western">
        <surname>Simpson</surname>  
        <given-names>MS</given-names></name>  
        <name name-style="western">
        <surname>Voorhees</surname>  
        <given-names>EM</given-names></name>  
        <name name-style="western">
        <surname>Hersh</surname>  
        <given-names>W</given-names></name> </person-group>
        <article-title>Overview of the TREC 2014 Clinical Decision Support Track</article-title>
        <source>NIST Special Publication 500-308: The Twenty-Third Text REtrieval Conference Proceedings (TREC 2014)</source>  
        <year>2014</year>  
        <month>11</month>  
        <conf-name>TREC 2014</conf-name>
        <conf-date>November 18-21, 2014</conf-date>
        <conf-loc>Gaithersburg, MD</conf-loc>
        <fpage>1</fpage>  
        <lpage>8</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://trec.nist.gov/pubs/trec23/papers/overview-clinical.pdf"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
        <name name-style="western">
        <surname>Roberts</surname>  
        <given-names>K</given-names></name>  
        <name name-style="western">
        <surname>Simpson</surname>  
        <given-names>MS</given-names></name>  
        <name name-style="western">
        <surname>Voorhees</surname>  
        <given-names>EM</given-names></name>  
        <name name-style="western">
        <surname>Hersh</surname>  
        <given-names>WR</given-names></name> </person-group>
        <article-title>Overview of the TREC 2015 Clinical Decision Support Track</article-title>
        <source>NIST Special Publication: SP 500-319: Proceedings of the Twenty-Fourth Text REtrieval Conference (TREC 2015)</source>  
        <year>2015</year>  
        <month>11</month>  
        <conf-name>TREC 2015</conf-name>
        <conf-date>November 17–20, 2015</conf-date>
        <conf-loc>Gaithersburg, MD</conf-loc>
        <fpage>1</fpage>  
        <lpage>12</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://trec.nist.gov/pubs/trec24/papers/Overview-CL.pdf"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
        <name name-style="western">
        <surname>Roberts</surname>  
        <given-names>K</given-names></name>  
        <name name-style="western">
        <surname>Demner-Fushman</surname>  
        <given-names>D</given-names></name>  
        <name name-style="western">
        <surname>Voorhees</surname>  
        <given-names>EM</given-names></name>  
        <name name-style="western">
        <surname>Hersh</surname>  
        <given-names>WR</given-names></name> </person-group>
        <article-title>Overview of the TREC 2016 Clinical Decision Support Track</article-title>
        <source>NIST Special Publication: SP 500-321: Proceedings of the Twenty-Fifth Text REtrieval Conference (TREC 2016)</source>  
        <year>2016</year>  
        <month>11</month>  
        <conf-name>TREC 2016</conf-name>
        <conf-date>November 15–18, 2016</conf-date>
        <conf-loc>Gaithersburg, MD</conf-loc>
        <fpage>1</fpage>  
        <lpage>14</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://trec.nist.gov/pubs/trec25/papers/Overview-CL.pdf"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
        <name name-style="western">
        <surname>Roberts</surname>  
        <given-names>K</given-names></name>  
        <name name-style="western">
        <surname>Demner-Fushman</surname>  
        <given-names>D</given-names></name>  
        <name name-style="western">
        <surname>Voorhees</surname>  
        <given-names>EM</given-names></name>  
        <name name-style="western">
        <surname>Hersh</surname>  
        <given-names>WR</given-names></name>  
        <name name-style="western">
        <surname>Bedrick</surname>  
        <given-names>S</given-names></name>  
        <name name-style="western">
        <surname>Lazar</surname>  
        <given-names>AJ</given-names></name>  
        <name name-style="western">
        <surname>Pant</surname>  
        <given-names>S</given-names></name> </person-group>
        <article-title>Overview of the TREC 2017 Precision Medicine Track</article-title>
        <source>NIST Special Publication: SP 500-324: Proceedings of the Twenty-Sixth Text REtrieval Conference (TREC 2017)</source>  
        <year>2017</year>  
        <month>11</month>  
        <conf-name>TREC 2017</conf-name>
        <conf-date>November 15–17, 2017</conf-date>
        <conf-loc>Gaithersburg, MD</conf-loc>
        <fpage>1</fpage>  
        <lpage>13</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://trec.nist.gov/pubs/trec26/papers/Overview-PM.pdf"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <collab>CLEF eHealth Evaluation Lab</collab>
        </person-group>
        <source>CLEF eHealth</source>  
        <access-date>2019-01-21</access-date>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://sites.google.com/site/clefehealth/home">https://sites.google.com/site/clefehealth/home</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="75aIciOBv"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Morita</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Aramaki</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Kano</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Miyabe</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Ohkuma</surname>
            <given-names>T</given-names>
          </name>
        </person-group>
        <source>Sociocom</source>  
        <access-date>2019-01-21</access-date>
        <comment>About NTCIR-10 “Medical Natural Language Processing (MedNLP)” Pilot Task 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://sociocom.jp/~mednlp/medistj-en/index.html">http://sociocom.jp/~mednlp/medistj-en/index.html</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="75aJauZEE"/></comment> </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Aramaki</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Morita</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Kano</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Ohkuma</surname>
            <given-names>T</given-names>
          </name>
        </person-group>
        <source>NTCIR11 MedNLP 2</source>  
        <access-date>2019-01-21</access-date>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://sociocom.jp/~mednlp/ntcir11/index-ja.html">http://sociocom.jp/~mednlp/ntcir11/index-ja.html</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="75aJRWq5j"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Aramaki</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Morita</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Kano</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Ohkuma</surname>
            <given-names>T</given-names>
          </name>
        </person-group>
        <source>MedNLPDoc</source>  
        <access-date>2019-01-21</access-date>
        <comment>NTCIR MEDNLPDOC (MEDNLP-3) 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://sites.google.com/site/mednlpdoc/">https://sites.google.com/site/mednlpdoc/</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="75aJ90OXu"/></comment> </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
        <name name-style="western">
        <surname>Morita</surname>  
        <given-names>M</given-names></name>  
        <name name-style="western">
        <surname>Kano</surname>  
        <given-names>Y</given-names></name>  
        <name name-style="western">
        <surname>Ohkuma</surname>  
        <given-names>T</given-names></name>  
        <name name-style="western">
        <surname>Miyabe</surname>  
        <given-names>M</given-names></name>  
        <name name-style="western">
        <surname>Aramaki</surname>  
        <given-names>E</given-names></name> </person-group>
        <article-title>Overview of the NTCIR-10 MedNLP Task</article-title>
        <source>Proceedings of the 10th NTCIR Conference</source>  
        <year>2013</year>  
        <month>06</month>  
        <conf-name>NTCIR-10 Conference</conf-name>
        <conf-date>June 18-21, 2013</conf-date>
        <conf-loc>Tokyo, Japan</conf-loc>
        <fpage>696</fpage>  
        <lpage>701</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://research.nii.ac.jp/ntcir/workshop/OnlineProceedings10/pdf/NTCIR/MedNLP/01-NTCIR10-OV-MEDNLP-MoritaM.pdf"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
        <name name-style="western">
        <surname>Aramaki</surname>  
        <given-names>E</given-names></name>  
        <name name-style="western">
        <surname>Morita</surname>  
        <given-names>M</given-names></name>  
        <name name-style="western">
        <surname>Kano</surname>  
        <given-names>Y</given-names></name>  
        <name name-style="western">
        <surname>Ohkuma</surname>  
        <given-names>T</given-names></name> </person-group>
        <article-title>Overview of the NTCIR-11 MedNLP-2 Task</article-title>
        <source>Proceedings of the 11th NTCIR Conference</source>  
        <year>2014</year>  
        <month>12</month>  
        <conf-name>NTCIR-11 Conference</conf-name>
        <conf-date>December 9-12, 2014</conf-date>
        <conf-loc>Tokyo, Japan</conf-loc>
        <fpage>147</fpage>  
        <lpage>54</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://research.nii.ac.jp/ntcir/workshop/OnlineProceedings11/pdf/NTCIR/OVERVIEW/01-NTCIR11-OV-MEDNLP-AramakiE.pdf"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
        <name name-style="western">
        <surname>Aramaki</surname>  
        <given-names>E</given-names></name>  
        <name name-style="western">
        <surname>Morita</surname>  
        <given-names>M</given-names></name>  
        <name name-style="western">
        <surname>Kano</surname>  
        <given-names>Y</given-names></name>  
        <name name-style="western">
        <surname>Ohkuma</surname>  
        <given-names>T</given-names></name> </person-group>
        <article-title>Overview of the NTCIR-12 MedNLPDoc Task</article-title>
        <source>Proceedings of the 12th NTCIR Conference on Evaluation of Information Access Technologies</source>  
        <year>2016</year>  
        <month>06</month>  
        <conf-name>NTCIR-12 Conference on Evaluation of Information Access Technologies</conf-name>
        <conf-date>June 7-10, 2016</conf-date>
        <conf-loc>Tokyo, Japan</conf-loc>
        <fpage>71</fpage>  
        <lpage>75</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://research.nii.ac.jp/ntcir/workshop/OnlineProceedings12/pdf/ntcir/OVERVIEW/01-NTCIR12-OV-MEDNLPDOC-AramakiE.pdf"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Polgreen</surname>
            <given-names>PM</given-names>
          </name>
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Pennock</surname>
            <given-names>DM</given-names>
          </name>
          <name name-style="western">
            <surname>Nelson</surname>
            <given-names>FD</given-names>
          </name>
        </person-group>
        <article-title>Using internet searches for influenza surveillance</article-title>
        <source>Clin Infect Dis</source>  
        <year>2008</year>  
        <month>12</month>  
        <day>1</day>  
        <volume>47</volume>  
        <issue>11</issue>  
        <fpage>1443</fpage>  
        <lpage>8</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.cid.oxfordjournals.org/cgi/pmidlookup?view=long&amp;pmid=18954267"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1086/593098</pub-id>
        <pub-id pub-id-type="medline">18954267</pub-id></nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
        <name name-style="western">
        <surname>Culotta</surname>  
        <given-names>A</given-names></name> </person-group>
        <article-title>Towards Detecting Influenza Epidemics by Analyzing Twitter Messages</article-title>
        <source>Proceedings of the First Workshop on Social Media Analytics</source>  
        <year>2010</year>  
        <month>07</month>  
        <conf-name>SOMA'10</conf-name>
        <conf-date>July 25-28, 2010</conf-date>
        <conf-loc>Washington DC, District of Columbia</conf-loc>
        <publisher-name>ACM</publisher-name>
        <fpage>115</fpage>  
        <lpage>22</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/citation.cfm?id=1964874&amp;dl=ACM&amp;coll=DL"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Aramaki</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Maskawa</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Morita</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>Twitter Catches the Flu: Detecting Influenza Epidemics Using Twitter</article-title>
        <source>Proceedings of the Conference on Empirical Methods in Natural Language Processing</source>  
        <year>2011</year>  
        <month>07</month>  
        <conf-name>EMNLP'11</conf-name>
        <conf-date>July 27–31, 2011</conf-date>
        <conf-loc>Edinburgh, Scotland, UK</conf-loc>
        <fpage>1568</fpage>  
        <lpage>76</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://dl.acm.org/citation.cfm?id=2145432.2145600"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Signorini</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Segre</surname>
            <given-names>AM</given-names>
          </name>
          <name name-style="western">
            <surname>Polgreen</surname>
            <given-names>PM</given-names>
          </name>
        </person-group>
        <article-title>The use of Twitter to track levels of disease activity and public concern in the US during the influenza A H1N1 pandemic</article-title>
        <source>PLoS One</source>  
        <year>2011</year>  
        <month>05</month>  
        <day>4</day>  
        <volume>6</volume>  
        <issue>5</issue>  
        <fpage>e19467</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0019467"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1371/journal.pone.0019467</pub-id>
        <pub-id pub-id-type="medline">21573238</pub-id>
        <pub-id pub-id-type="pii">PONE-D-10-02464</pub-id>
        <pub-id pub-id-type="pmcid">PMC3087759</pub-id></nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Achrekar</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Gandhe</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Lazarus</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Yu</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>B</given-names>
          </name>
        </person-group>
        <source>University of Massachusetts Lowell</source>  
        <year>2012</year>  
        <month>02</month>  
        <access-date>2019-01-22</access-date>
        <comment>Twitter improves Seasonal Influenza Prediction 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.cs.uml.edu/~hachreka/SNEFT/images/healthinf_2012.pdf">http://www.cs.uml.edu/~hachreka/SNEFT/images/healthinf_2012.pdf</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="75cOHwa9E"/></comment> </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Lamb</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Paul</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Dredze</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <source>The Association for Computational Linguistics</source>  
        <year>2013</year>  
        <access-date>2019-01-22</access-date>
        <comment>Separating Fact from Fear: Tracking Flu Infections on Twitter 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.aclweb.org/anthology/N13-1097">http://www.aclweb.org/anthology/N13-1097</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="75cOPDkio"/></comment> </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Gesualdo</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Stilo</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Agricola</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Gonfiantini</surname>
            <given-names>MV</given-names>
          </name>
          <name name-style="western">
            <surname>Pandolfi</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Velardi</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Tozzi</surname>
            <given-names>AE</given-names>
          </name>
        </person-group>
        <article-title>Influenza-like illness surveillance on Twitter through automated learning of naïve language</article-title>
        <source>PLoS One</source>  
        <year>2013</year>  
        <volume>8</volume>  
        <issue>12</issue>  
        <fpage>e82489</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0082489"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1371/journal.pone.0082489</pub-id>
        <pub-id pub-id-type="medline">24324799</pub-id>
        <pub-id pub-id-type="pii">PONE-D-13-24070</pub-id>
        <pub-id pub-id-type="pmcid">PMC3853203</pub-id></nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Broniatowski</surname>
            <given-names>DA</given-names>
          </name>
          <name name-style="western">
            <surname>Paul</surname>
            <given-names>MJ</given-names>
          </name>
          <name name-style="western">
            <surname>Dredze</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>National and local influenza surveillance through Twitter: an analysis of the 2012-2013 influenza epidemic</article-title>
        <source>PLoS One</source>  
        <year>2013</year>  
        <volume>8</volume>  
        <issue>12</issue>  
        <fpage>e83672</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0083672"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1371/journal.pone.0083672</pub-id>
        <pub-id pub-id-type="medline">24349542</pub-id>
        <pub-id pub-id-type="pii">PONE-D-13-35058</pub-id>
        <pub-id pub-id-type="pmcid">PMC3857320</pub-id></nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Paul</surname>
            <given-names>MJ</given-names>
          </name>
          <name name-style="western">
            <surname>Dredze</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Broniatowski</surname>
            <given-names>D</given-names>
          </name>
        </person-group>
        <article-title>Twitter improves influenza forecasting</article-title>
        <source>PLoS Curr</source>  
        <year>2014</year>  
        <month>10</month>  
        <day>28</day>  
        <volume>6</volume>  
        <issue>5</issue>  
        <fpage>225</fpage>  
        <lpage>6</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.doi.org/10.1371/currents.outbreaks.90b9ed0f59bae4ccaa683a39865d9117"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1371/currents.outbreaks.90b9ed0f59bae4ccaa683a39865d9117</pub-id>
        <pub-id pub-id-type="medline">25642377</pub-id>
        <pub-id pub-id-type="pmcid">PMC4234396</pub-id></nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Charles-Smith</surname>
            <given-names>LE</given-names>
          </name>
          <name name-style="western">
            <surname>Reynolds</surname>
            <given-names>TL</given-names>
          </name>
          <name name-style="western">
            <surname>Cameron</surname>
            <given-names>MA</given-names>
          </name>
          <name name-style="western">
            <surname>Conway</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Lau</surname>
            <given-names>EH</given-names>
          </name>
          <name name-style="western">
            <surname>Olsen</surname>
            <given-names>JM</given-names>
          </name>
          <name name-style="western">
            <surname>Pavlin</surname>
            <given-names>JA</given-names>
          </name>
          <name name-style="western">
            <surname>Shigematsu</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Streichert</surname>
            <given-names>LC</given-names>
          </name>
          <name name-style="western">
            <surname>Suda</surname>
            <given-names>KJ</given-names>
          </name>
          <name name-style="western">
            <surname>Corley</surname>
            <given-names>CD</given-names>
          </name>
        </person-group>
        <article-title>Using social media for actionable disease surveillance and outbreak management: a systematic literature review</article-title>
        <source>PLoS One</source>  
        <year>2015</year>  
        <month>10</month>  
        <volume>10</volume>  
        <issue>10</issue>  
        <fpage>e0139701</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.plos.org/10.1371/journal.pone.0139701"/>
        </comment>  
        <pub-id pub-id-type="doi">10.1371/journal.pone.0139701</pub-id>
        <pub-id pub-id-type="medline">26437454</pub-id>
        <pub-id pub-id-type="pii">PONE-D-15-21599</pub-id>
        <pub-id pub-id-type="pmcid">PMC4593536</pub-id></nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Iso</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Wakamiya</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Aramaki</surname>
            <given-names>E</given-names>
          </name>
        </person-group>
        <source>The Association for Computational Linguistics</source>  
        <year>2016</year>  
        <access-date>2019-01-22</access-date>
        <comment>Forecasting Word Model: Twitter-based Influenza Surveillance and Prediction 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.aclweb.org/anthology/C16-1008">http://www.aclweb.org/anthology/C16-1008</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="75cOYLTHS"/></comment> </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="web">
        <source>NTCIR</source>  
        <access-date>2019-01-21</access-date>
        <comment>NTCIR-13 Conference 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://research.nii.ac.jp/ntcir/ntcir-13/conference.html">http://research.nii.ac.jp/ntcir/ntcir-13/conference.html</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="75aHh6YcI"/></comment> </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Aramaki</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Wakamiya</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Morita</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Kano</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Ohkuma</surname>
            <given-names>T</given-names>
          </name>
        </person-group>
        <source>NTCIR-13 MedWeb</source>  
        <access-date>2019-01-21</access-date>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://mednlp.jp/medweb/NTCIR-13/">http://mednlp.jp/medweb/NTCIR-13/</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="75aHyBXJK"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
        <name name-style="western">
        <surname>Wakamiya</surname>  
        <given-names>S</given-names></name>  
        <name name-style="western">
        <surname>Morita</surname>  
        <given-names>M</given-names></name>  
        <name name-style="western">
        <surname>Kano</surname>  
        <given-names>Y</given-names></name>  
        <name name-style="western">
        <surname>Ohkuma</surname>  
        <given-names>T</given-names></name>  
        <name name-style="western">
        <surname>Aramaki</surname>  
        <given-names>E</given-names></name> </person-group>
        <article-title>Overview of the NTCIR-13: MedWeb Task</article-title>
        <source>Proceedings of the 13th NTCIR Conference on Evaluation of Information Access Technologies</source>  
        <year>2017</year>  
        <month>12</month>  
        <conf-name>NTCIR-13 Conference</conf-name>
        <conf-date>December 5-8, 2017</conf-date>
        <conf-loc>Tokyo, Japan</conf-loc>
        <fpage>40</fpage>  
        <lpage>49</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://tinyurl.com/y4w4sckt"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="web">
        <source>Twitter</source>  
        <access-date>2019-01-21</access-date>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://twitter.com/">https://twitter.com/</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="75aIADN5x"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="web">
        <source>Facebook</source>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://www.facebook.com/">https://www.facebook.com/</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="75aIfrC4W"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
        <name name-style="western">
        <surname>Sakai</surname>  
        <given-names>M</given-names></name>  
        <name name-style="western">
        <surname>Tanioka</surname>  
        <given-names>H</given-names></name> </person-group>
        <article-title>Keyword-based Challenges at the NTCIR-13 MedWeb</article-title>
        <source>Proceedings of the 13th NTCIR Conference on Evaluation of Information Access Technologies</source>  
        <year>2017</year>  
        <month>12</month>  
        <conf-name>NTCIR-13 Conference</conf-name>
        <conf-date>December 5-8, 2017</conf-date>
        <conf-loc>Tokyo, Japan</conf-loc>
        <fpage>50</fpage>  
        <lpage>51</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://research.nii.ac.jp/ntcir/workshop/OnlineProceedings13/pdf/ntcir/02-NTCIR13-MEDWEB-SakaiM.pdf"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
        <name name-style="western">
        <surname>Asakawa</surname>  
        <given-names>R</given-names></name>  
        <name name-style="western">
        <surname>Akiba</surname>  
        <given-names>T</given-names></name> </person-group>
        <article-title>AKBL at the NTCIR-13 MedWeb Task</article-title>
        <source>Proceedings of the 13th NTCIR Conference on Evaluation of Information Access Technologies</source>  
        <year>2017</year>  
        <month>12</month>  
        <conf-name>NTCIR-13 Conference</conf-name>
        <conf-date>December 5-8, 2017</conf-date>
        <conf-loc>Tokyo, Japan</conf-loc>
        <fpage>52</fpage>  
        <lpage>55</lpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://research.nii.ac.jp/ntcir/workshop/OnlineProceedings13/pdf/ntcir/03-NTCIR13-MEDWEB-AsakawaR.pdf"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Morita</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Takagi</surname>
            <given-names>T</given-names>
          </name>
        </person-group>
        <article-title>DrG at NTCIR-13: MedWeb Task</article-title>
        <source>Proceedings of the 13th NTCIR Conference on Evaluation of Information Access Technologies</source>  
        <year>2017</year>  
        <month>12</month>  
        <conf-name>NTCIR-13 Conference</conf-name>
        <conf-date>December 5-8, 2017</conf-date>
        <conf-loc>Tokyo, Japan</conf-loc>
        <fpage>81</fpage>  
        <lpage>4</lpage>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://research.nii.ac.jp/ntcir/workshop/OnlineProceedings13/pdf/ntcir/10-NTCIR13-MEDWEB-MoritaK.pdf"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Sakishita</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Kano</surname>
            <given-names>Y</given-names>
          </name>
        </person-group>
        <article-title>Classification of Tweet Posters for Diseases by Combined Rule-Based and Machine Learning Method in NTCIR-13: MedWeb Twitter Task (Japanese Subtask)</article-title>
        <source>Proceedings of the 13th NTCIR Conference on Evaluation of Information Access Technologies</source>  
        <year>2017</year>  
        <month>12</month>  
        <conf-name>NTCIR-13 Conference</conf-name>
        <conf-date>December 5-8, 2017</conf-date>
        <conf-loc>Tokyo, Japan</conf-loc>
        <fpage>62</fpage>  
        <lpage>4</lpage>
         <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://research.nii.ac.jp/ntcir/workshop/OnlineProceedings13/pdf/ntcir/05-NTCIR13-MEDWEB-SakishitaM.pdf"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Iso</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Ruiz</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Murayama</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Taguchi</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Takeuchi</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Yamamoto</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Wakamiya</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Aramaki</surname>
            <given-names>E</given-names>
          </name>
        </person-group>
        <article-title>NTCIR13 MedWeb Task: Multi-label Classification of Tweets using an Ensemble of Neural Networks</article-title>
        <source>Proceedings of the 13th NTCIR Conference on Evaluation of Information Access Technologies</source>  
        <year>2017</year>  
        <month>12</month>  
        <conf-name>NTCIR-13 Conference</conf-name>
        <conf-date>December 5-8, 2017</conf-date>
        <conf-loc>Tokyo, Japan</conf-loc>
        <fpage>56</fpage>  
        <lpage>61</lpage>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://research.nii.ac.jp/ntcir/workshop/OnlineProceedings13/pdf/ntcir/04-NTCIR13-MEDWEB-IsoH.pdf"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Ito</surname>
            <given-names>M</given-names>
          </name>
        </person-group>
        <article-title>NIL: Using scoring to analyse the ambiguous messages on the NTCIR-13 MedWeb task</article-title>
        <source>Proceedings of the 13th NTCIR Conference on Evaluation of Information Access Technologies</source>  
        <year>2017</year>  
        <month>12</month>  
        <conf-name>NTCIR-13 Conference</conf-name>
        <conf-date>December 5-8, 2017</conf-date>
        <conf-loc>Tokyo, Japan</conf-loc>
        <fpage>74</fpage>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://research.nii.ac.jp/ntcir/workshop/OnlineProceedings13/pdf/ntcir/08-NTCIR13-MEDWEB-ItoM.pdf"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Lin</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Dai</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Shao</surname>
            <given-names>J</given-names>
          </name>
        </person-group>
        <article-title>Principle Base Approach for Classifying Tweets with Flu-related Information in NTCIR-13 MedWeb Task</article-title>
        <source>Proceedings of the 13th NTCIR Conference on Evaluation of Information Access Technologies</source>  
        <year>2017</year>  
        <month>12</month>  
        <conf-name>NTCIR-13 Conference</conf-name>
        <conf-date>December 5-8, 2017</conf-date>
        <conf-loc>Tokyo, Japan</conf-loc>
        <fpage>71</fpage>  
        <lpage>73</lpage>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://research.nii.ac.jp/ntcir/workshop/OnlineProceedings13/pdf/ntcir/07-NTCIR13-MEDWEB-LinJ.pdf"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Li</surname>
            <given-names>C</given-names>
          </name>
          <name name-style="western">
            <surname>Kang</surname>
            <given-names>X</given-names>
          </name>
          <name name-style="western">
            <surname>Ren</surname>
            <given-names>F</given-names>
          </name>
        </person-group>
        <article-title>Medweb Task: Identify Multi-Symptoms from Tweets Based on Active Learning and Semantic Information</article-title>
        <source>Proceedings of the 13th NTCIR Conference on Evaluation of Information Access Technologies</source>  
        <year>2017</year>  
        <month>12</month>  
        <conf-name>NTCIR-13 Conference</conf-name>
        <conf-date>December 5-8, 2017</conf-date>
        <conf-loc>Tokyo, Japan</conf-loc>
        <fpage>75</fpage>  
        <lpage>80</lpage>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://research.nii.ac.jp/ntcir/workshop/OnlineProceedings13/pdf/ntcir/09-NTCIR13-MEDWEB-LiC.pdf"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Hang</surname>
            <given-names>N</given-names>
          </name>
          <name name-style="western">
            <surname>Kobayashi</surname>
            <given-names>H</given-names>
          </name>
          <name name-style="western">
            <surname>Quaresma</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Sawai</surname>
            <given-names>Y</given-names>
          </name>
        </person-group>
        <article-title>UE and Nikon at the NTCIR-13 MedWeb Task</article-title>
        <source>Proceedings of the 13th NTCIR Conference on Evaluation of Information Access Technologies</source>  
        <year>2017</year>  
        <month>12</month>  
        <conf-name>NTCIR-13 Conference</conf-name>
        <conf-date>December 5-9, 2017</conf-date>
        <conf-loc>Tokyo, Japan</conf-loc>
        <fpage>65</fpage>  
        <lpage>70</lpage>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://research.nii.ac.jp/ntcir/workshop/OnlineProceedings13/pdf/ntcir/06-NTCIR13-MEDWEB-TranA.pdf"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="web">
        <source>Twitter Developer Platform</source>  
        <access-date>2019-01-21</access-date>
        <comment>Developer Agreement and Policy 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://developer.twitter.com/en/developer-terms/agreement-and-policy.html">https://developer.twitter.com/en/developer-terms/agreement-and-policy.html</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="75aHAkMpb"/></comment> </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="web">
        <source>Twitter Developer Platform</source>  
        <access-date>2019-01-21</access-date>
        <comment>API Docs 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://developer.twitter.com/en/docs.html">https://developer.twitter.com/en/docs.html</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="75aHSWKV3"/></comment> </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="web">
        <source>NTCIR-13 MedWeb</source>  
        <year>2018</year>  
        <month>07</month>  
        <day>23</day>  
        <access-date>2018-08-23</access-date>
        <comment>NTCIR-13 MedWeb (Medical Natural Language Processing for Web Document) 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://research.nii.ac.jp/ntcir/permission/ntcir-13/perm-en-MedWeb.html">http://research.nii.ac.jp/ntcir/permission/ntcir-13/perm-en-MedWeb.html</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="71sPdfSWe"/></comment> </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Aramaki</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Wakamiya</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Morita</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Kano</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Ohkuma</surname>
            <given-names>T</given-names>
          </name>
        </person-group>
        <source>Figshare</source>  
        <year>2018</year>  
        <month>04</month>  
        <day>02</day>  
        <access-date>2019-01-21</access-date>
        <comment>NTCIR-13 MedWeb Annotation Corpus Guideline (English Ver 2.0) 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://figshare.com/articles/NTCIR-13_MedWeb_Annotation_Corpus_Guideline_English_Ver_2_0_/6072812">https://figshare.com/articles/NTCIR-13_MedWeb_Annotation_Corpus_Guideline_English_Ver_2_0_/6072812</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="75aGzBMsz"/></comment> </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Aramaki</surname>
            <given-names>E</given-names>
          </name>
          <name name-style="western">
            <surname>Wakamiya</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Morita</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Kano</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Ohkuma</surname>
            <given-names>T</given-names>
          </name>
        </person-group>
        <source>Figshare</source>  
        <year>2018</year>  
        <month>04</month>  
        <day>2</day>  
        <access-date>2019-01-21</access-date>
        <comment>NTCIR-13 MedWeb Annotation Corpus Guideline (Japanese Ver 2.0) 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://figshare.com/articles/NTCIR-13_MedWeb_Annotation_Corpus_Guideline_Japanese_Ver_2_0_/6072821">https://figshare.com/articles/NTCIR-13_MedWeb_Annotation_Corpus_Guideline_Japanese_Ver_2_0_/6072821</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="75aGfxygF"/></comment> </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Kudo</surname>
            <given-names>T</given-names>
          </name>
          <name name-style="western">
            <surname>Yamamoto</surname>
            <given-names>K</given-names>
          </name>
          <name name-style="western">
            <surname>Matsumoto</surname>
            <given-names>Y</given-names>
          </name>
        </person-group>
        <source>ACL Anthology Reference Corpus</source>  
        <year>2014</year>  
        <month>07</month>  
        <access-date>2019-01-22</access-date>
        <comment>Applying conditional random fields to Japanese morphological analysis 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://acl-arc.comp.nus.edu.sg/archives/acl-arc-090501d4/data/pdf/anthology-PDF/W/W04/W04-3230.pdf">http://acl-arc.comp.nus.edu.sg/archives/acl-arc-090501d4/data/pdf/anthology-PDF/W/W04/W04-3230.pdf</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="75cOn2Nsj"/></comment> </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="confproc">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Bird</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <article-title>NLTK: The Natural Language Toolkit</article-title>
        <source>Proceedings of the COLING/ACL 2006 Interactive Presentation Sessions</source>  
        <year>2006</year>  
        <month>07</month>  
        <conf-name>COLING/ACL 2006</conf-name>
        <conf-date>July 17–21, 2006</conf-date>
        <conf-loc>Sydney, Australia</conf-loc>
        <fpage>69</fpage>  
        <lpage>72</lpage> </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="web">
        <source>Natural Language Toolkit—NLTK 3.4 documentation</source>  
        <access-date>2019-01-21</access-date>
        <comment>nltk.tokenize package 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.nltk.org/api/nltk.tokenize.html">http://www.nltk.org/api/nltk.tokenize.html</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="75aGQkD2p"/></comment> </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Junyi</surname>
            <given-names>S</given-names>
          </name>
        </person-group>
        <source>GitHub</source>  
        <access-date>2014-01-27</access-date>
        <comment>jieba 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/fxsjy/jieba">https://github.com/fxsjy/jieba</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6MvXve9OT"/></comment> </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="web">
        <source>scikit-learn: Machine Learning in Python</source>  
        <access-date>2018-11-04</access-date>
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://scikit-learn.org/stable/">http://scikit-learn.org/stable/</ext-link>
          <ext-link ext-link-type="webcite" xlink:href="73eSO5vZc"/>
        </comment> </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="web">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Pedregosa</surname>
            <given-names>F</given-names>
          </name>
          <name name-style="western">
            <surname>Varoquaux</surname>
            <given-names>G</given-names>
          </name>
          <name name-style="western">
            <surname>Gramfort</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Michel</surname>
            <given-names>V</given-names>
          </name>
          <name name-style="western">
            <surname>Thirion</surname>
            <given-names>B</given-names>
          </name>
          <name name-style="western">
            <surname>Grisel</surname>
            <given-names>O</given-names>
          </name>
          <name name-style="western">
            <surname>Blondel</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Prettenhofer</surname>
            <given-names>P</given-names>
          </name>
          <name name-style="western">
            <surname>Weiss</surname>
            <given-names>R</given-names>
          </name>
          <name name-style="western">
            <surname>Dubourg</surname>
            <given-names>V</given-names>
          </name>
          <name name-style="western">
            <surname>Vanderplas</surname>
            <given-names>J</given-names>
          </name>
          <name name-style="western">
            <surname>Passos</surname>
            <given-names>A</given-names>
          </name>
          <name name-style="western">
            <surname>Cournapeau</surname>
            <given-names>D</given-names>
          </name>
          <name name-style="western">
            <surname>Brucher</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Perrot</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Duchesnay</surname>
            <given-names>É</given-names>
          </name>
        </person-group>
        <source>Journal of Machine Learning Research</source>  
        <year>2011</year>  
        <month>10</month>  
        <day>11</day>  
        <access-date>2019-01-22</access-date>
        <comment>Scikit-learn: Machine Learning in Python 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://www.jmlr.org/papers/volume12/pedregosa11a/pedregosa11a.pdf">http://www.jmlr.org/papers/volume12/pedregosa11a/pedregosa11a.pdf</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="75cFEGrlb"/></comment> </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>M</given-names>
          </name>
          <name name-style="western">
            <surname>Zhou</surname>
            <given-names>Z</given-names>
          </name>
        </person-group>
        <article-title>A review on multi-label learning algorithms</article-title>
        <source>IEEE Trans Knowl Data Eng</source>  
        <year>2014</year>  
        <month>8</month>  
        <volume>26</volume>  
        <issue>8</issue>  
        <fpage>1819</fpage>  
        <lpage>37</lpage>  
        <pub-id pub-id-type="doi">10.1109/TKDE.2013.39</pub-id></nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="web">
        <source>National Institutes of Health</source>  
        <access-date>2018-03-30</access-date>
        <comment>Turning Discovery into Health 
        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="https://www.nih.gov/sites/default/files/about-nih/discovery-into-health/nih-turning-discovery-into-health.pdf">https://www.nih.gov/sites/default/files/about-nih/discovery-into-health/nih-turning-discovery-into-health.pdf</ext-link>
        <ext-link ext-link-type="webcite" xlink:href="6yIXFi28d"/></comment> </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
        <person-group person-group-type="author">
          <name name-style="western">
            <surname>Wakamiya</surname>
            <given-names>S</given-names>
          </name>
          <name name-style="western">
            <surname>Kawai</surname>
            <given-names>Y</given-names>
          </name>
          <name name-style="western">
            <surname>Aramaki</surname>
            <given-names>E</given-names>
          </name>
        </person-group>
        <article-title>Twitter-based influenza detection after flu peak via tweets with indirect information: text mining study</article-title>
        <source>JMIR Public Health Surveill</source>  
        <year>2018</year>  
        <month>09</month>  
        <day>25</day>  
        <volume>4</volume>  
        <issue>3</issue>  
        <fpage>e65</fpage>  
        <comment>
          <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" ext-link-type="uri" xlink:type="simple" xlink:href="http://publichealth.jmir.org/2018/3/e65/"/>
        </comment>  
        <pub-id pub-id-type="doi">10.2196/publichealth.8627</pub-id>
        <pub-id pub-id-type="medline">30274968</pub-id>
        <pub-id pub-id-type="pii">v4i3e65</pub-id>
        <pub-id pub-id-type="pmcid">PMC6231889</pub-id></nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
