<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v25i1e49400</article-id>
      <article-id pub-id-type="pmid">37902815</article-id>
      <article-id pub-id-type="doi">10.2196/49400</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Early Warning and Prediction of Scarlet Fever in China Using the Baidu Search Index and Autoregressive Integrated Moving Average With Explanatory Variable (ARIMAX) Model: Time Series Analysis</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Mavragani</surname>
            <given-names>Amaryllis</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Walker</surname>
            <given-names>Mark</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Khairulbahri</surname>
            <given-names>Muhamad</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Zhao</surname>
            <given-names>Chenhao</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Wang</surname>
            <given-names>Yongbin</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Luo</surname>
            <given-names>Tingyan</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7668-315X</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Zhou</surname>
            <given-names>Jie</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6164-3649</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>Jing</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0175-6470</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Xie</surname>
            <given-names>Yulan</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0003-6448-6572</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Wei</surname>
            <given-names>Yiru</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0006-1272-7348</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Mai</surname>
            <given-names>Huanzhuo</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6095-8809</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Lu</surname>
            <given-names>Dongjia</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0006-0232-1846</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>Yuecong</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6412-8121</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author">
          <name name-style="western">
            <surname>Cui</surname>
            <given-names>Ping</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7195-2832</ext-link>
        </contrib>
        <contrib id="contrib10" contrib-type="author">
          <name name-style="western">
            <surname>Ye</surname>
            <given-names>Li</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7688-4867</ext-link>
        </contrib>
        <contrib id="contrib11" contrib-type="author">
          <name name-style="western">
            <surname>Liang</surname>
            <given-names>Hao</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7534-5124</ext-link>
        </contrib>
        <contrib id="contrib12" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Huang</surname>
            <given-names>Jiegang</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>School of Public Health</institution>
            <institution>Guangxi Medical University</institution>
            <addr-line>22 Shuangyong Road, Qingxiu District</addr-line>
            <addr-line>Nanning, 530021</addr-line>
            <country>China</country>
            <phone>86 07715334215</phone>
            <email>jieganghuang@gxmu.edu.cn</email>
          </address>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-3271-1694</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>School of Public Health</institution>
        <institution>Guangxi Medical University</institution>
        <addr-line>Nanning</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Guangxi Key Laboratory of AIDS Prevention and Treatment</institution>
        <institution>Guangxi Medical University</institution>
        <addr-line>Nanning</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Life Science Institute</institution>
        <institution>Guangxi Medical University</institution>
        <addr-line>Nanning</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Guangxi Colleges and Universities Key Laboratory of Prevention and Control of Highly Prevalent Disease</institution>
        <institution>Guangxi Medical University</institution>
        <addr-line>Nanning</addr-line>
        <country>China</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Jiegang Huang <email>jieganghuang@gxmu.edu.cn</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2023</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>30</day>
        <month>10</month>
        <year>2023</year>
      </pub-date>
      <volume>25</volume>
      <elocation-id>e49400</elocation-id>
      <history>
        <date date-type="received">
          <day>27</day>
          <month>5</month>
          <year>2023</year>
        </date>
        <date date-type="rev-request">
          <day>25</day>
          <month>7</month>
          <year>2023</year>
        </date>
        <date date-type="rev-recd">
          <day>23</day>
          <month>8</month>
          <year>2023</year>
        </date>
        <date date-type="accepted">
          <day>26</day>
          <month>9</month>
          <year>2023</year>
        </date>
      </history>
      <copyright-statement>©Tingyan Luo, Jie Zhou, Jing Yang, Yulan Xie, Yiru Wei, Huanzhuo Mai, Dongjia Lu, Yuecong Yang, Ping Cui, Li Ye, Hao Liang, Jiegang Huang. Originally published in the Journal of Medical Internet Research (https://www.jmir.org), 30.10.2023.</copyright-statement>
      <copyright-year>2023</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on https://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2023/1/e49400" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Internet-derived data and the autoregressive integrated moving average (ARIMA) and ARIMA with explanatory variable (ARIMAX) models are extensively used for infectious disease surveillance. However, the effectiveness of the Baidu search index (BSI) in predicting the incidence of scarlet fever remains uncertain.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>Our objective was to investigate whether a low-cost BSI monitoring system could potentially function as a valuable complement to traditional scarlet fever surveillance in China.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>ARIMA and ARIMAX models were developed to predict the incidence of scarlet fever in China using data from the National Health Commission of the People’s Republic of China between January 2011 and August 2022. The procedures included establishing a keyword database, keyword selection and filtering through Spearman rank correlation and cross-correlation analyses, construction of the scarlet fever comprehensive search index (CSI), modeling with the training sets, predicting with the testing sets, and comparing the prediction performances.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>The average monthly incidence of scarlet fever was 4462.17 (SD 3011.75) cases, and annual incidence exhibited an upward trend until 2019. The keyword database contained 52 keywords, but only 6 highly relevant ones were selected for modeling. A high Spearman rank correlation was observed between the scarlet fever reported cases and the scarlet fever CSI (r<sub>s</sub>=0.881). We developed the ARIMA(4,0,0)(0,1,2)<sub>(12)</sub> model, and the ARIMA(4,0,0)(0,1,2)<sub>(12)</sub> + CSI (Lag=0) and ARIMAX(1,0,2)(2,0,0)<sub>(12)</sub> models were combined with the BSI. The 3 models had a good fit and passed the residuals Ljung-Box test. The ARIMA(4,0,0)(0,1,2)<sub>(12)</sub>, ARIMA(4,0,0)(0,1,2)<sub>(12)</sub> + CSI (Lag=0), and ARIMAX(1,0,2)(2,0,0)<sub>(12)</sub> models demonstrated favorable predictive capabilities, with mean absolute errors of 1692.16 (95% CI 584.88-2799.44), 1067.89 (95% CI 402.02-1733.76), and 639.75 (95% CI 188.12-1091.38), respectively; root mean squared errors of 2036.92 (95% CI 929.64-3144.20), 1224.92 (95% CI 559.04-1890.79), and 830.80 (95% CI 379.17-1282.43), respectively; and mean absolute percentage errors of 4.33% (95% CI 0.54%-8.13%), 3.36% (95% CI –0.24% to 6.96%), and 2.16% (95% CI –0.69% to 5.00%), respectively. The ARIMAX models outperformed the ARIMA models and had better prediction performances with smaller values.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>This study demonstrated that the BSI can be used for the early warning and prediction of scarlet fever, serving as a valuable supplement to traditional surveillance systems.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>scarlet fever</kwd>
        <kwd>Baidu search index</kwd>
        <kwd>autoregressive integrated moving average</kwd>
        <kwd>ARIMA</kwd>
        <kwd>warning</kwd>
        <kwd>prediction</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Scarlet fever is an acute respiratory contagious disease caused by group A <italic>Streptococcus pyogenes</italic> infection and is classified as a category B notifiable infectious disease in China [<xref ref-type="bibr" rid="ref1">1</xref>]. It is a seasonal disease that typically occurs during winter and spring, and no vaccine is currently available for prevention. Carriers and patients with scarlet fever are the primary sources of infection, which occurs mainly through airborne droplets. The population is generally susceptible, with children and adolescents being particularly vulnerable [<xref ref-type="bibr" rid="ref2">2</xref>]. Clinical symptoms in infected patients are characterized by fever, pharyngitis, a diffuse bright red rash over the body, and skin flaking after the rash has disappeared [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref4">4</xref>]. The global incidence of scarlet fever has increased significantly since 2011, particularly in China, where a study has shown that the average annual incidence of scarlet fever between 2011 and 2016 was twice as high as that between 2004 and 2011 [<xref ref-type="bibr" rid="ref5">5</xref>]. The resurgence of scarlet fever has emerged as a significant global public health issue [<xref ref-type="bibr" rid="ref6">6</xref>]. Therefore, in order to comprehend the pattern and trend of scarlet fever outbreaks and facilitate the rational allocation of public health resources in China, a reliable prediction method is needed to identify the recent mode of the scarlet fever epidemic.</p>
      <p>Currently, the autoregressive integrated moving average (ARIMA) model is one of the most commonly used time series methods and is extensively used in the early warning of infectious diseases [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref7">7</xref>-<xref ref-type="bibr" rid="ref9">9</xref>]. The occurrence of scarlet fever exhibits seasonality and temporal correlation. The ARIMA model is capable of capturing such cyclic patterns and accounting for autocorrelation in time series data, thereby enhancing predictive precision. The emergence of disease is typically orchestrated by a confluence of diverse factors. By incorporating a multitude of exogenous variables, the ARIMA with explanatory variables (ARIMAX) model has shown enhanced capability in forecasting and delineating the progression of disease incidence [<xref ref-type="bibr" rid="ref10">10</xref>]. The applicability of the ARIMA model in scarlet fever forecasting and early warning has been substantiated in China [<xref ref-type="bibr" rid="ref3">3</xref>].</p>
      <p>An increasing number of individuals are inclined to search for health-related information on the internet before seeking medical services, opening up the potential for early disease surveillance by monitoring fluctuations in the frequency of specific search keywords [<xref ref-type="bibr" rid="ref11">11</xref>]. Internet-derived data revealed substantial potential in the application of infectious disease surveillance worldwide [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>]. Google’s influenza monitoring data became available 2 weeks before official announcements in the United States [<xref ref-type="bibr" rid="ref14">14</xref>]. In China, with over 904 million internet users, Baidu has the highest search engine market penetration and is used by over 90% of internet users, making it the most representative tool for measuring user behavior domestically [<xref ref-type="bibr" rid="ref15">15</xref>]. Furthermore, the Baidu search index (BSI) can visually depict the changing trends in keyword search popularity. Studies have indicated that the BSI can be used for the early warning and prediction of communicable diseases, such as dengue fever [<xref ref-type="bibr" rid="ref11">11</xref>], COVID-19 [<xref ref-type="bibr" rid="ref15">15</xref>], and syphilis [<xref ref-type="bibr" rid="ref16">16</xref>], in China.</p>
      <p>However, scarlet fever is relatively underreported compared to influenza, and it is still unknown whether the BSI can enhance the predictive and early warning capacity for scarlet fever. Therefore, we developed an ARIMA model with scarlet fever cases and multiple ARIMAX models incorporating the BSI to investigate whether a low-cost, internet-based monitoring system can effectively complement traditional scarlet fever surveillance in China and provide a scientific basis for formulating strategies and policies for the prevention and control of infectious diseases.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Ethical Considerations</title>
        <p>Data were obtained from the public National Health Commission of the People’s Republic of China database [<xref ref-type="bibr" rid="ref17">17</xref>] and the researchers did not have access to individual patient details. The medical research ethics committee of the Guangxi Medical University determined that this research did not require ethics approval according to the following Chinese law: Notice by the National Health Commission, the Ministry of Education, the Ministry of Science and Technology, and the National Administration of Traditional Chinese Medicine of Issuing the Measures for Ethical Review of Life Science and Medical Research Involving Human Being (No. 4 of the National Health Commission, 2023).</p>
      </sec>
      <sec>
        <title>Data Sources</title>
        <sec>
          <title>Epidemiological Data for Scarlet Fever</title>
          <p>This study used monthly reported data from the National Health Commission of the People’s Republic of China [<xref ref-type="bibr" rid="ref17">17</xref>] covering 140 months from January 2011 to August 2022. The data is publicly available for research purposes, no personal information is involved, and the collection of monthly reported data has been fully completed.</p>
        </sec>
        <sec>
          <title>BSI Data</title>
          <p>We obtained real-time search data and keywords for the same period from the BSI [<xref ref-type="bibr" rid="ref18">18</xref>]. The keyword search index was based on the volume of information search queries conducted by Baidu search users and achieved through a corresponding calculation process. We collected data for relevant keywords spanning from January 2011 to August 2022 and converted them into monthly counts for subsequent analysis using Microsoft Excel 2019 (Microsoft Corporation).</p>
        </sec>
      </sec>
      <sec>
        <title>Keyword Selection and Analysis</title>
        <sec>
          <title>Establishing a Keyword Database</title>
          <p>The effectiveness of the model in predicting outbreaks using internet-derived data relies on selecting appropriate keywords for model fitting. Thus, selecting relevant keywords is crucial for ensuring accurate model fitting. Keywords related to scarlet fever with complete time series were collected using the following three approaches: (1) obtaining scarlet fever–related syndrome words using the ChinaZ website [<xref ref-type="bibr" rid="ref19">19</xref>], (2) obtaining words related to scarlet fever according to the Baidu index demand map [<xref ref-type="bibr" rid="ref20">20</xref>], and (3) mining keywords using semantic analysis of scarlet fever through the Baidu encyclopedia [<xref ref-type="bibr" rid="ref21">21</xref>] and the Baidu health medical dictionary [<xref ref-type="bibr" rid="ref22">22</xref>]. Eventually, the keywords were divided into 4 categories in Microsoft Excel 2019, namely, scarlet fever comprehensive category, etiology, symptoms, and prevention and treatment [<xref ref-type="bibr" rid="ref23">23</xref>-<xref ref-type="bibr" rid="ref25">25</xref>].</p>
        </sec>
        <sec>
          <title>Keyword Exclusion Criteria</title>
          <p>Keywords were excluded based on the following criteria: (1) keywords irrelevant to the epidemic or clinical information of scarlet fever, (2) keywords with a Spearman rank correlation (r<sub>s</sub>) &#60;0.6 between scarlet fever reported cases and the BSI or <italic>P&#62;</italic>.05 [<xref ref-type="bibr" rid="ref26">26</xref>], and (3) keywords with a maximum cross-correlation coefficient &#60;0.5 [<xref ref-type="bibr" rid="ref27">27</xref>]. The analyses were performed using SPSS 26.0 (IBM).</p>
        </sec>
      </sec>
      <sec>
        <title>Construction of the Comprehensive Search Index</title>
        <p>After the correlation analysis, a scarlet fever comprehensive search index (CSI) [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref27">27</xref>] was calculated as follows:</p>
        <disp-formula>
          <graphic xlink:href="jmir_v25i1e49400_fig7.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </disp-formula>
        <p>where k is potential time lag in months, n is the number of keywords contained in each time lag, <sub>ki</sub> is the Spearman correlation coefficient for keyword i with a specific time lag k, and weight<sub>ki</sub> and keyword<sub>ki</sub> are the keyword’s weight and BSI in a lag period, respectively.</p>
      </sec>
      <sec>
        <title>Model Construction and Evaluation</title>
        <sec>
          <title>Model Description</title>
          <p>The ARIMA model is commonly used for forecasting the incidence of scarlet fever. Considering the time autocorrelation between the data points and the seasonal transmission pattern of scarlet fever, the model expression is ARIMA(p,d,q)(P,D,Q)<sub>(S)</sub> [<xref ref-type="bibr" rid="ref10">10</xref>], where d and D represent the nonseasonal and seasonal difference orders, respectively; p and q represent the autoregressive and moving average orders, respectively; P and Q represent the seasonal autoregressive and moving average orders, respectively; and S is the period of the sequence [<xref ref-type="bibr" rid="ref8">8</xref>]. ARIMAX is a multivariable version of ARIMA that combined scarlet fever reported cases with the scarlet fever CSI, thus using the BSI as the external variable [<xref ref-type="bibr" rid="ref26">26</xref>]. The construction and evaluation of the model were performed using R 4.2.0 (R Foundation for Statistical Computing), following the described process.</p>
        </sec>
        <sec>
          <title>Stationarity Tests for Time Series</title>
          <p>We plotted the time series of scarlet fever reported cases and the scarlet fever CSI to observe long-term trends from January 2011 to August 2022. The stationarity was tested using the augmented Dickey-Fuller (ADF) and Ljung-Box tests [<xref ref-type="bibr" rid="ref10">10</xref>]. Nonstationary sequences were transformed into stationary sequences by difference and exponential transformation.</p>
        </sec>
        <sec>
          <title>Splitting the Training and Testing Sets</title>
          <p>Based on the stationary sequences, we divided the scarlet fever reported cases and the CSI data into the training sets for model construction running from January 2011 to August 2021 and the testing sets for model prediction running from September 2021 to August 2022. To evaluate the impact of the COVID-19 pandemic on scarlet fever, we conducted a subgroup analysis with the training sets running from January 2011 to December 2018 and the testing sets running from January 2019 to August 2022.</p>
        </sec>
        <sec>
          <title>Model Selection</title>
          <p>We used the scarlet fever reported cases training set to construct the ARIMA model, and both the scarlet fever reported cases and CSI training sets for the ARIMAX model. We used the <italic>auto.arima</italic> function for automatic selection and manual selection through examination of the autocorrelation function (ACF) and partial autocorrelation function (PACF) plots. First, the ARIMA and ARIMAX models were based on the <italic>auto.arima</italic> function and the minimum Akaike information criterion (AIC). Next, the orders and ranges of the ARIMA model were determined based on the ACF and PACF plots. We performed multiple fittings and searched for the optimal ARIMA(p,d,q)(P,D,Q)<sub>(S)</sub> model using the minimum AIC [<xref ref-type="bibr" rid="ref26">26</xref>]. Then, we plotted the cross-correlation function (CCF) plot between scarlet fever and the CSI to determine the appropriate lag order for the ARIMAX model [<xref ref-type="bibr" rid="ref8">8</xref>]. If the coefficient for a specific lag order exceeded 2 SD, the CSI at that lag order was considered correlated with scarlet fever. Finally, all models were tested using the least squares method (LSM; <italic>P</italic>&#60;.05 indicated model estimation was significant) and parameter estimation (<italic>P</italic>&#60;.05 indicated a statistically significant parameter). The model diagnosis was performed using the residuals Ljung-Box test (<italic>P</italic>&#62;.05 indicated the model variables were independent) [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref26">26</xref>]. After passing the tests, the models proceeded to the prediction section.</p>
        </sec>
        <sec>
          <title>Evaluation of the Model Fit</title>
          <p>The model fit was assessed using R<sup>2</sup>, AIC, root mean square error (RMSE), mean absolute error (MAE), and mean absolute percentage error (MAPE). A higher R<sup>2</sup> value and lower values of the remaining variables indicated a better fit of the model.</p>
        </sec>
        <sec>
          <title>Evaluation of the Model Prediction</title>
          <p>The ARIMA and ARIMAX models were used for predicting the incidence of scarlet fever with the testing sets, and the predictions were compared to the actual incidence. We evaluated the model prediction effects through MAE, RMSE, and MAPE. Smaller values indicated better predictions. The flow chart of this study is shown in <xref rid="figure1" ref-type="fig">Figure 1</xref>. All tests were 2-sided, and <italic>P&#60;</italic>.05 indicated significance.</p>
          <fig id="figure1" position="float">
            <label>Figure 1</label>
            <caption>
              <p>Research flowchart. ACF: autocorrelation function; ARIMA: autoregressive integrated moving average; ARIMAX: autoregressive integrated moving average with explanatory variable; PACF: partial autocorrelation function.</p>
            </caption>
            <graphic xlink:href="jmir_v25i1e49400_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Descriptive Analysis</title>
        <p>From January 2011 to August 2022, the average monthly incidence of scarlet fever was 4462.17 (SD 3011.75) cases, with an annual incidence of 53,546.06 cases. The annual incidence of scarlet fever showed an upward trend until 2019, reaching a peak of 83,028 cases in 2019. The keyword database comprised 52 keywords categorized into the following categories: scarlet fever comprehensive category, etiology, symptoms, and prevention and treatment (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p>
      </sec>
      <sec>
        <title>Correlation Analysis Between the Baidu Search Index and Scarlet Fever</title>
        <p>The results of the Spearman rank correlation analysis revealed a strong temporal correlation between 6 keywords from the BSI and scarlet fever reported cases (r<sub>s</sub>&#62;0.6; <xref ref-type="table" rid="table1">Table 1</xref>). The remaining keywords showed weak correlation or no statistical difference. Plotting the time series of high-correlation keywords, such as “猩红热症状 (symptoms of scarlet fever)” (<xref rid="figure2" ref-type="fig">Figure 2</xref>A) and “猩红热传染吗 (Is scarlet fever contagious?)” (<xref rid="figure2" ref-type="fig">Figure 2</xref>B), and comparing them with scarlet fever reported cases, the overall trends of the two keywords were consistent with the actual incidence.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Spearman rank correlation analysis between the monthly Baidu search index keywords and scarlet fever reported cases.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="490"/>
            <col width="190"/>
            <col width="120"/>
            <col width="200"/>
            <thead>
              <tr valign="top">
                <td>Keywords<sup>a</sup></td>
                <td>r<sub>s</sub><sup>b</sup></td>
                <td><italic>P</italic> value</td>
                <td>Search volume, mean (SD)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>猩红热传染吗 (Is scarlet fever contagious?)</td>
                <td>0.834</td>
                <td>&#60;.001</td>
                <td>182.197 (89.909)</td>
              </tr>
              <tr valign="top">
                <td>猩红热症状 (symptoms of scarlet fever)</td>
                <td>0.818</td>
                <td>&#60;.001</td>
                <td>565.129 (330.355)</td>
              </tr>
              <tr valign="top">
                <td>猩红热图片 (scarlet fever pictures)</td>
                <td>0.750</td>
                <td>&#60;.001</td>
                <td>235.494 (111.399)</td>
              </tr>
              <tr valign="top">
                <td>猩红热 (scarlet fever)</td>
                <td>0.746</td>
                <td>&#60;.001</td>
                <td>1482.185 (634.117)</td>
              </tr>
              <tr valign="top">
                <td>猩红热症状图片 (scarlet fever symptoms pictures)</td>
                <td>0.698</td>
                <td>&#60;.001</td>
                <td>77.723 (49.489)</td>
              </tr>
              <tr valign="top">
                <td>猩红热的症状 (scarlet fever symptoms)</td>
                <td>0.649</td>
                <td>&#60;.001</td>
                <td>92.044 (37.554)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>Keywords were presented in a Chinese (English) format.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>r<sub>s</sub>: Spearman rank correlation.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Time series between scarlet fever reported cases and (A) the keywords “symptoms of scarlet fever,” (B) the keywords “Is scarlet fever contagious?” or (C) the scarlet fever comprehensive search index.</p>
          </caption>
          <graphic xlink:href="jmir_v25i1e49400_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Cross-Correlation Analysis and the CSI</title>
        <p>Cross-correlation analysis was performed between keywords with r<sub>s</sub>&#62;0.6 and scarlet fever reported cases. We selected 6 keywords with a maximum cross-correlation coefficient &#62;0.5 (<italic>P</italic>&#60;.001) within the lag range (<xref ref-type="table" rid="table2">Table 2</xref>). We calculated the weight of each keyword using a formula and used the weight to construct the scarlet fever CSI by aggregating the BSI of each keyword. Spearman rank correlation analysis showed a high correlation between scarlet fever reported cases and the scarlet fever CSI (r<sub>s</sub>=0.881).</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Cross-correlation analysis between scarlet fever reported cases and Baidu search index keywords.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="500"/>
            <col width="250"/>
            <col width="250"/>
            <thead>
              <tr valign="top">
                <td>Keywords<sup>a</sup></td>
                <td>Lag (months)</td>
                <td>Maximum CCF<sup>b</sup> (SE)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>猩红热传染吗 (Is scarlet fever contagious?)</td>
                <td>0</td>
                <td>0.813 (0.088)</td>
              </tr>
              <tr valign="top">
                <td>猩红热 (scarlet fever)</td>
                <td>0</td>
                <td>0.827 (0.088)</td>
              </tr>
              <tr valign="top">
                <td>猩红热症状 (symptoms of scarlet fever)</td>
                <td>0</td>
                <td>0.809 (0.088)</td>
              </tr>
              <tr valign="top">
                <td>猩红热图片 (scarlet fever pictures)</td>
                <td>0</td>
                <td>0.729 (0.088)</td>
              </tr>
              <tr valign="top">
                <td>猩红热症状图片 (scarlet fever symptoms pictures)</td>
                <td>0</td>
                <td>0.678 (0.088)</td>
              </tr>
              <tr valign="top">
                <td>猩红热的症状 (scarlet fever symptoms)</td>
                <td>0</td>
                <td>0.614 (0.088)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>Keywords were presented in a Chinese (English) format.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>CCF: cross-correlation function.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Model Construction and Prediction Evaluation</title>
        <sec>
          <title>Stationarity Tests for Time Series</title>
          <p>Plotting the time series of scarlet fever reported cases and the scarlet fever CSI from January 2011 to August 2022 showed irregular fluctuating patterns (<xref rid="figure2" ref-type="fig">Figure 2</xref>C). The stationarity was tested using the ADF and Ljung-Box tests. The results of the ADF test indicated that the time series of scarlet fever reported cases (<italic>P</italic>=.70) and the scarlet fever CSI (<italic>P</italic>=.90) were nonstationary; they were transformed into stationary series by first order differencing (<xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>), after which they passed the ADF test (<italic>P</italic>=.01). The 2 series were applied to construct and predict the incidence of scarlet fever based on the Ljung-Box test (<italic>P</italic>&#60;.001).</p>
        </sec>
        <sec>
          <title>Model Selection</title>
          <p>The models ARIMA(4,0,0)(0,1,1)<sub>(12)</sub> and ARIMAX(1,0,2)(2,0,0)<sub>(12)</sub> were constructed according to the <italic>auto.arima</italic> function and the AIC minimum principle.</p>
          <p>The ACF and PACF plots of the stationary scarlet fever series showed that the ACF trailed off and the PACF was truncated at a lag of 4 months (<xref rid="figure3" ref-type="fig">Figure 3</xref>). The ACF plot exhibited a seasonal pattern with a period of 12 months, and the sequence was different by first order and passed the ADF (<italic>P</italic>=.01). Therefore, the parameters of the ARIMA model were p=4, q=0, d=0, D=1, and S=12. The model was fitted using different values for the parameters ranging from 0 to 2 in a stepwise manner from lower to higher orders [<xref ref-type="bibr" rid="ref10">10</xref>]. After conducting combination tests, the model ARIMA(4,0,0)(0,1,2)<sub>(12)</sub> was selected based on the minimum AIC of 1947.03, and the residuals conformed to a white noise sequence (χ<sup>2</sup>=0.145; <italic>P</italic>=.70).</p>
          <p>The CCF plot considered the mutual relationship within a lag of 12 months, revealing that the CSI at a lag of 0 months exhibited the strongest correlation with scarlet fever (<xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>). The stationary time series of CSI at a lag of 0 months was used as the input sequence for constructing the ARIMA(4,0,0)(0,1,2)<sub>(12)</sub> + CSI (Lag=0) and ARIMA(4,0,0)(0,1,1)<sub>(12)</sub> + CSI (Lag=0) models. All the aforementioned models passed the LSM and the residuals Ljung-Box tests (<xref ref-type="table" rid="table3">Table 3</xref>). The results of the model parameter estimation are presented in <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>. Although not every parameter exhibited significance, the estimated SEs of the parameters were relatively small, indicating minimal variability. Based on the minimum AIC principle and comprehensive evaluation of the fitting metrics (<xref ref-type="table" rid="table3">Table 3</xref>), we finally selected the ARIMA(4,0,0)(0,1,2)<sub>(12)</sub> (Model 1), ARIMA(4,0,0)(0,1,2)<sub>(12)</sub> + CSI (Lag=0) (Model 2), and ARIMAX(1,0,2)(2,0,0)<sub>(12)</sub> (Model 3) models for predictive analysis.</p>
          <fig id="figure3" position="float">
            <label>Figure 3</label>
            <caption>
              <p>The (A) ACF and (B) PACF plots of scarlet fever. ACF: autocorrelation function; PACF: partial autocorrelation function.</p>
            </caption>
            <graphic xlink:href="jmir_v25i1e49400_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
          <table-wrap position="float" id="table3">
            <label>Table 3</label>
            <caption>
              <p>Evaluation of the model fit and diagnosis.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="0"/>
              <col width="160"/>
              <col width="110"/>
              <col width="100"/>
              <col width="130"/>
              <col width="80"/>
              <col width="0"/>
              <col width="100"/>
              <col width="70"/>
              <col width="80"/>
              <col width="90"/>
              <col width="80"/>
              <thead>
                <tr valign="top">
                  <td colspan="2">Model</td>
                  <td>ADF<sup>a</sup>, <italic>P</italic> value</td>
                  <td colspan="4">Diagnosis</td>
                  <td colspan="5">Fit</td>
                </tr>
                <tr valign="top">
                  <td colspan="2">
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>LSM<sup>b</sup>, <italic>P</italic> value</td>
                  <td colspan="2">Ljung-Box test</td>
                  <td colspan="2">AIC<sup>c</sup><break/>  <break/>  </td>
                  <td>R<sup>2</sup></td>
                  <td>RMSE<sup>d</sup></td>
                  <td>MAE<sup>e</sup></td>
                  <td>MAPE<sup>f</sup></td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>Chi-square</td>
                  <td><italic>P</italic> value</td>
                  <td colspan="2">
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                  <td>
                    <break/>
                  </td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td colspan="2">ARIMA(4,0,0)(0,1,2)<sub>(12)</sub></td>
                  <td>.01</td>
                  <td>&#60;.001</td>
                  <td>0.15</td>
                  <td>.70</td>
                  <td colspan="2">1947.03</td>
                  <td>0.87</td>
                  <td>924.6</td>
                  <td>626.44</td>
                  <td>709.00</td>
                </tr>
                <tr valign="top">
                  <td colspan="2">ARIMA(4,0,0)(0,1,2)<sub>(12)</sub> + CSI (Lag=0)</td>
                  <td>.01</td>
                  <td>&#60;.001</td>
                  <td>0.01</td>
                  <td>.94</td>
                  <td colspan="2">1894.89</td>
                  <td>0.91</td>
                  <td>755.76</td>
                  <td>545.01</td>
                  <td>588.56</td>
                </tr>
                <tr valign="top">
                  <td colspan="2">ARIMAX(1,0,2)(2,0,0)<sub>(12)</sub></td>
                  <td>.01</td>
                  <td>&#60;.001</td>
                  <td>0.03</td>
                  <td>.86</td>
                  <td colspan="2">2083.73</td>
                  <td>0.90</td>
                  <td>815.90</td>
                  <td>635.43</td>
                  <td>508.98</td>
                </tr>
                <tr valign="top">
                  <td colspan="2">ARIMA(4,0,0)(0,1,1)<sub>(12)</sub></td>
                  <td>.01</td>
                  <td>&#60;.001</td>
                  <td>0.16</td>
                  <td>.69</td>
                  <td colspan="2">1950.43</td>
                  <td>0.85</td>
                  <td>1006.71</td>
                  <td>694.06</td>
                  <td>876.77</td>
                </tr>
                <tr valign="top">
                  <td colspan="2">ARIMA(4,0,0)(0,1,1)<sub>(12)</sub> + CSI (Lag=0)</td>
                  <td>.01</td>
                  <td>&#60;.001</td>
                  <td>0.01</td>
                  <td>.92</td>
                  <td colspan="2">1893.99</td>
                  <td>0.91</td>
                  <td>779.49</td>
                  <td>563.22</td>
                  <td>643.87</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table3fn1">
                <p><sup>a</sup>ADF: augmented Dickey-Fuller.</p>
              </fn>
              <fn id="table3fn2">
                <p><sup>b</sup>LSM: least squares method.</p>
              </fn>
              <fn id="table3fn3">
                <p><sup>c</sup>AIC: Akaike information criterion.</p>
              </fn>
              <fn id="table3fn4">
                <p><sup>d</sup>RMSE: root mean square error.</p>
              </fn>
              <fn id="table3fn5">
                <p><sup>e</sup>MAE: mean absolute error.</p>
              </fn>
              <fn id="table3fn6">
                <p><sup>f</sup>MAPE: mean absolute percentage error.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
        </sec>
        <sec>
          <title>Model Fitting and Diagnosis</title>
          <p>Model 1 (<xref rid="figure4" ref-type="fig">Figure 4</xref>A), Model 2 (<xref rid="figure5" ref-type="fig">Figure 5</xref>A), and Model 3 (<xref rid="figure6" ref-type="fig">Figure 6</xref>A) showed good fitting performances with well-matched fitted and true values. Residual checking was conducted for Model 1 (<xref rid="figure4" ref-type="fig">Figure 4</xref>B-E), Model 2 (<xref rid="figure5" ref-type="fig">Figure 5</xref>B-E), and Model 3 (<xref rid="figure6" ref-type="fig">Figure 6</xref>B-E). The inspection of the residuals revealed the following results: Q-Q plots showed that the residuals followed a normal distribution, residual plots fluctuated around 0, and ACF and PACF plots were almost within the 95% CI. These findings confirmed that the models were suitable for the prediction session.</p>
          <fig id="figure4" position="float">
            <label>Figure 4</label>
            <caption>
              <p>ARIMA(4,0,0)(0,1,2)<sub>(12)</sub> model fitting, diagnosis, and prediction results. (A) Fitting and prediction results. Yellow and black are the fitted and true values of the training sets respectively. Red indicates the true values of the testing sets, and blue indicates the predicted values. (B) Normal Q-Q plot. The solid black line represents the theoretical quantile line. (C) Residual plot. (D) ACF plot. (E) PACF plot. The blue dashed lines in (D) and (E) indicate the confidence interval. ACF: autocorrelation function; ARIMA: autoregressive integrated moving average; PACF: partial autocorrelation function.</p>
            </caption>
            <graphic xlink:href="jmir_v25i1e49400_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
          <fig id="figure5" position="float">
            <label>Figure 5</label>
            <caption>
              <p>ARIMA(4,0,0)(0,1,2)<sub>(12)</sub>+CSI (Lag=0) model fitting, diagnosis, and prediction results. (A) Fitting and prediction results. Yellow and black are the fitted and true values of the training sets respectively. Red indicates the true values of the testing sets, and blue indicates the predicted values. (B) Normal Q-Q plot. The solid black line represents the theoretical quantile line. (C) Residual plot. (D) ACF plot. (E) PACF plot. The blue dashed lines in (D) and (E) indicate the confidence interval. ACF: autocorrelation function; ARIMA: autoregressive integrated moving average; CSI: comprehensive search index; PACF: partial autocorrelation function.</p>
            </caption>
            <graphic xlink:href="jmir_v25i1e49400_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
          <fig id="figure6" position="float">
            <label>Figure 6</label>
            <caption>
              <p>ARIMAX(1,0,2)(2,0,0)<sub>(12)</sub> model fitting, diagnosis, and prediction results. (A) Fitting and prediction results. Yellow and black are the fitted and true values of the training sets respectively. Red indicates the true values of the testing sets, and blue indicates the predicted values. (B) Normal Q-Q plot. The solid black line represents the theoretical quantile line. (C) Residual plot. (D) ACF plot. (E) PACF plot. The blue dashed lines in (D) and (E) indicate the confidence interval. ACF: autocorrelation function; ARIMAX: autoregressive integrated moving average with explanatory variable; PACF: partial autocorrelation function.</p>
            </caption>
            <graphic xlink:href="jmir_v25i1e49400_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Model Prediction and Evaluation</title>
          <p>The 3 models were used to forecast the incidence of scarlet fever with the testing sets. For Model 1 (<xref rid="figure4" ref-type="fig">Figure 4</xref>A), Model 2 (<xref rid="figure5" ref-type="fig">Figure 5</xref>A), and Model 3 (<xref rid="figure6" ref-type="fig">Figure 6</xref>A), the predicted and true values largely coincided, with the true values falling within the predicted interval. Comparing the performances of the models, the two ARIMAX models incorporating the BSI outperformed the ARIMA model, yielding lower MAE, RMSE, and MAPE values (<xref ref-type="table" rid="table4">Table 4</xref>).</p>
          <table-wrap position="float" id="table4">
            <label>Table 4</label>
            <caption>
              <p>Evaluation of model prediction effectiveness.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="380"/>
              <col width="200"/>
              <col width="200"/>
              <col width="220"/>
              <thead>
                <tr valign="top">
                  <td>Model</td>
                  <td>MAE<sup>a</sup> (95% CI)</td>
                  <td>RMSE<sup>b</sup> (95% CI)</td>
                  <td>MAPE<sup>c</sup>, % (95% CI)</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>ARIMA(4,0,0)(0,1,2)<sub>(12)</sub></td>
                  <td>1692.16 (584.88-2799.44)</td>
                  <td>2036.92 (929.64-3144.20)</td>
                  <td>4.33 (0.54-8.13)</td>
                </tr>
                <tr valign="top">
                  <td>ARIMA(4,0,0)(0,1,2)<sub>(12)</sub> + CSI (Lag=0)</td>
                  <td>1067.89 (402.02-1733.76)</td>
                  <td>1224.92 (559.04-1890.79)</td>
                  <td>3.36 (–0.24 to 6.96)</td>
                </tr>
                <tr valign="top">
                  <td>ARIMAX(1,0,2)(2,0,0)<sub>(12)</sub></td>
                  <td>639.75 (188.12-1091.38)</td>
                  <td>830.80 (379.17-1282.43)</td>
                  <td>2.16 (–0.69 to 5.00)</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table4fn1">
                <p><sup>a</sup>MAE: mean absolute error.</p>
              </fn>
              <fn id="table4fn2">
                <p><sup>b</sup>RMSE: root mean square error.</p>
              </fn>
              <fn id="table4fn3">
                <p><sup>c</sup>MAPE: mean absolute percentage error.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
        </sec>
      </sec>
      <sec>
        <title>Subgroup Analysis</title>
        <p>In the original scarlet fever sequence, a significant decrease was noted in 2020. This decline may be attributed to the widespread outbreak of COVID-19, which could potentially have an impact on the model. To assess the impact of the pandemic on scarlet fever, models were constructed using training sets from 2011 to 2018. Subsequently, we predicted the incidence of scarlet fever in 2019, 2020, 2021, and from January to August 2022, then compared the predictions with the actual incidence. We employed a combination of the <italic>auto.arima</italic> function and ACF with PACF plots to construct the ARIMA(4,0,0)(2,1,0)<sub>(12)</sub> and ARIMAX(0,0,3)(1,0,0)<sub>(12)</sub> models based on the minimum AIC principle. The two models successfully passed the LSM (<italic>P</italic>&#60;.001) and the residuals Ljung-Box (<italic>P</italic>=.93 and <italic>P</italic>=.87, respectively) tests. The fitting and predictive performances of the models are presented in <xref ref-type="supplementary-material" rid="app5">Multimedia Appendix 5</xref>.</p>
        <p>The results indicated that the predictive performances of both models declined in 2020 compared to the other years. However, the ARIMAX models, which incorporated the BSI, exhibited enhanced predictive capabilities and partially alleviated the impact of the pandemic.</p>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <p>Scarlet fever is highly prevalent among children aged 5-15 years. It was the primary cause of mortality among children in the 18th and 19th centuries [<xref ref-type="bibr" rid="ref4">4</xref>]. This study revealed that, from 2011 to 2022, the monthly incidence of scarlet fever was 4462.17 (SD 3011.75) cases, with an annual incidence of 53,546.06 cases. The highest incidence was observed in 2019. Previous studies have demonstrated that scarlet fever underwent a global resurgence with a sharp rise in the United Kingdom, Germany, Korea, and China between 2011 and 2014 [<xref ref-type="bibr" rid="ref28">28</xref>]. Compared to the preoutbreak level, the annual incidence of scarlet fever doubled in China [<xref ref-type="bibr" rid="ref5">5</xref>], tripled in the United Kingdom [<xref ref-type="bibr" rid="ref29">29</xref>], and quadrupled in Korea [<xref ref-type="bibr" rid="ref30">30</xref>]. The resurgence of scarlet fever in China may be related to the rapid economic development, improved living standards, meteorological conditions, and genetic characteristics of the host population [<xref ref-type="bibr" rid="ref31">31</xref>]. The relaxation of the two-child and three-child policies has increased in the susceptible population. The largest study on scarlet fever conducted by Liu et al [<xref ref-type="bibr" rid="ref5">5</xref>] revealed that the elevated incidence of scarlet fever in northern China may be connected to the cold seasons, poor ventilation, and a gradual replacement of emm1 genotypes resulting in a reduction in cross-immunity. As scarlet fever is susceptible to previous cases, prioritizing the improvement of early warning and prediction systems is crucial. There is an urgent need to explore innovative monitoring methods.</p>
      <p>The outbreak of infectious diseases has significant health implications and noticeably impacts health care systems and economies. Certain contagious diseases have high transmission rates and various modes of spread, making them prone to causing widespread epidemics. Thus, it is imperative to promptly identify and implement measures to curb their proliferation from the early stages. Conventional disease surveillance is inherently characterized by a degree of latency, whereas internet-derived data has the potential to offer real-time information, thus enabling the faster detection of early indicators of disease outbreaks. Eysenbach et al [<xref ref-type="bibr" rid="ref32">32</xref>] pioneered a significant precedent in using internet-derived data for disease surveillance. Studies indicated that the BSI can be employed in the early warning and prediction of infectious diseases [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>]. Therefore, we identified 6 keywords associated with scarlet fever. Among these keywords, those that were highly correlated with scarlet fever, such as “symptoms of scarlet fever” and “Is scarlet fever contagious?”, exhibited consistent temporal trends with scarlet fever. Their search volumes changed in accordance with variations in the prevalence of scarlet fever. Spearman rank correlation revealed a strong positive association between the aggregated CSI and scarlet fever (r<sub>s</sub>=0.881), indicating that the BSI can effectively capture variations in scarlet fever epidemics.</p>
      <p>The ARIMA model features low computational complexity, is versatile across various data types, and offers high precision in short-term predicting. This study employed scarlet fever time series data to construct the ARIMA(4,0,0)(0,1,2)<sub>(12)</sub> model, and incorporated the BSI as an external variable to construct the ARIMAX(1,0,2)(2,0,0)<sub>(12)</sub> and ARIMA(4,0,0)(0,1,2)<sub>(12)</sub> + CSI (Lag=0) models. The 3 models exhibited favorable fitting performances, and the ARIMAX models demonstrated superior predictive performances, whether established based on ACF and PACF plots or using the <italic>auto.arima</italic> function. The results were consistent with those for brucellosis [<xref ref-type="bibr" rid="ref26">26</xref>] and dengue fever [<xref ref-type="bibr" rid="ref11">11</xref>], demonstrating the effectiveness and predictive ability of the BSI in monitoring scarlet fever. The BSI provides real-time data that can be accessed promptly, monthly or even daily, whereas the data published by the Chinese official website often incurs delays of several months. These indicators may suggest an impending outbreak of scarlet fever when an unusual surge in vocabulary related to the disease is detected or when the predicted values computed by the model increase. Public health authorities can take proactive measures, prearrange prevention and control strategies, and allocate public health resources rationally.</p>
      <p>The COVID-19 outbreak posed an immense threat to human life and resulted in a worldwide pandemic. The original time series of scarlet fever revealed a substantial decrease in incidence in 2020, potentially influencing the performance of the model. Due to the overlapping symptoms of COVID-19 and scarlet fever, we conducted subgroup analyses to assess the epidemic’s impact and address potential variations. The results exhibited a decline in the model’s predictive performances in 2020, consistent with the findings from Ma et al [<xref ref-type="bibr" rid="ref2">2</xref>]. This decline could be attributed to the containment measures that were implemented, which may have disrupted the transmission pathways of the disease. Moreover, the ARIMAX model, which integrated the BSI, exhibited superior predictive performances, providing additional evidence for the successful use of the BSI concerning scarlet fever.</p>
      <p>This study had several limitations. First, scarlet fever is influenced by a variety of factors, including meteorological conditions, sanitation, and population immunity. This study exclusively used the BSI for analysis, but other factors could be considered in future analyses. Second, internet-derived data is susceptible to the impact of media coverage, possibly resulting in the inclusion of inaccurate information [<xref ref-type="bibr" rid="ref14">14</xref>]. Finally, Baidu search engines do not cover all internet users, and the keywords included in the BSI are not exhaustive. In the future, collaborative efforts with other search engines could be pursued to enhance the predictive capabilities of the model.</p>
      <p>In conclusion, the BSI can be used as a valuable supplement to traditional surveillance systems, providing early warning and prediction capabilities for scarlet fever. Furthermore, it presents novel perspectives and provides a theoretical foundation for the early identification and prediction of infectious diseases, thereby facilitating the timely implementation of public health intervention measures.</p>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Correlation between monthly Baidu search index keywords and reported cases of scarlet fever from January 2011 to August 2022.</p>
        <media xlink:href="jmir_v25i1e49400_app1.docx" xlink:title="DOCX File , 23 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Stationary series plots after first order differencing.</p>
        <media xlink:href="jmir_v25i1e49400_app2.png" xlink:title="PNG File , 122 KB"/>
      </supplementary-material>
      <supplementary-material id="app3">
        <label>Multimedia Appendix 3</label>
        <p>The CCF between scarlet fever and the comprehensive search index. Blue dashed lines indicate the 95% CI. CCF: cross-correlation function.</p>
        <media xlink:href="jmir_v25i1e49400_app3.png" xlink:title="PNG File , 28 KB"/>
      </supplementary-material>
      <supplementary-material id="app4">
        <label>Multimedia Appendix 4</label>
        <p>Parameter estimation of candidate models.</p>
        <media xlink:href="jmir_v25i1e49400_app4.docx" xlink:title="DOCX File , 19 KB"/>
      </supplementary-material>
      <supplementary-material id="app5">
        <label>Multimedia Appendix 5</label>
        <p>Evaluation of the model fit, diagnosis, and prediction. AIC: Akaike information criterion; LSM: least squares method; MAE: mean absolute error; RMSE: root mean square error; MAPE: mean absolute percentage error.</p>
        <media xlink:href="jmir_v25i1e49400_app5.docx" xlink:title="DOCX File , 14 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">ACF</term>
          <def>
            <p>autocorrelation function</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">ADF</term>
          <def>
            <p>augmented Dickey-Fuller</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">AIC</term>
          <def>
            <p>Akaike information criterion</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">ARIMA</term>
          <def>
            <p>autoregressive integrated moving average</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">ARIMAX</term>
          <def>
            <p>autoregressive integrated moving average with explanatory variable</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">BSI</term>
          <def>
            <p>Baidu search index</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">CCF</term>
          <def>
            <p>cross-correlation function</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">CSI</term>
          <def>
            <p>comprehensive search index</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">LSM</term>
          <def>
            <p>least squares method</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">MAE</term>
          <def>
            <p>mean absolute error</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">MAPE</term>
          <def>
            <p>mean absolute percentage error</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">PACF</term>
          <def>
            <p>partial autocorrelation function</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb13">RMSE</term>
          <def>
            <p>root mean square error</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This research was supported by the National Natural Science Foundation of China (grants 82273694 and 82060366) and the Innovation Project of Guangxi Graduate Education (grant YCBZ2022098).</p>
    </ack>
    <fn-group>
      <fn fn-type="con">
        <p>TL conducted the formal analysis and writing (drafting and revising). JH, TL, and JZ contributed to the conception and design of the study and additional analysis. JY, YX, YW, HM, DL, and YY performed data collection and review and the primary analysis. PC, LY, and HL were involved in conceptualization and supervision. JH supervised the study and contributed to writing (review and comments). All authors critically revised and reviewed the manuscript and contributed to the final approved version.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <article-title>Scarlet fever</article-title>
          <source>Nurs Stand</source>
          <year>2016</year>
          <month>04</month>
          <day>27</day>
          <volume>30</volume>
          <issue>35</issue>
          <fpage>17</fpage>
          <pub-id pub-id-type="doi">10.7748/ns.30.35.17.s20</pub-id>
          <pub-id pub-id-type="medline">27191292</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Shan</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Jiao</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Hao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Ning</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Cui</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Epidemiological trend in scarlet fever incidence in China during the COVID-19 pandemic: a time series analysis</article-title>
          <source>Front Public Health</source>
          <year>2022</year>
          <volume>10</volume>
          <fpage>923318</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/36589977"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fpubh.2022.923318</pub-id>
          <pub-id pub-id-type="medline">36589977</pub-id>
          <pub-id pub-id-type="pmcid">PMC9799716</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>WW</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Tian</surname>
              <given-names>DC</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Xia</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Xiong</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Su</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>WG</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Qi</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Forecasting the monthly incidence of scarlet fever in Chongqing, China using the SARIMA model</article-title>
          <source>Epidemiol Infect</source>
          <year>2022</year>
          <month>04</month>
          <day>21</day>
          <volume>150</volume>
          <fpage>e90</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35543101"/>
          </comment>
          <pub-id pub-id-type="doi">10.1017/S0950268822000693</pub-id>
          <pub-id pub-id-type="medline">35543101</pub-id>
          <pub-id pub-id-type="pii">S0950268822000693</pub-id>
          <pub-id pub-id-type="pmcid">PMC9102071</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Yuan</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Seasonality and trend prediction of scarlet fever incidence in mainland China from 2004 to 2018 using a hybrid SARIMA-NARX model</article-title>
          <source>PeerJ</source>
          <year>2019</year>
          <volume>7</volume>
          <fpage>e6165</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/30671295"/>
          </comment>
          <pub-id pub-id-type="doi">10.7717/peerj.6165</pub-id>
          <pub-id pub-id-type="medline">30671295</pub-id>
          <pub-id pub-id-type="pii">6165</pub-id>
          <pub-id pub-id-type="pmcid">PMC6339779</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chan</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Yap</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Qin</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Geng</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Resurgence of scarlet fever in China: a 13-year population-based surveillance study</article-title>
          <source>Lancet Infect Dis</source>
          <year>2018</year>
          <month>08</month>
          <volume>18</volume>
          <issue>8</issue>
          <fpage>903</fpage>
          <lpage>912</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/29858148"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S1473-3099(18)30231-7</pub-id>
          <pub-id pub-id-type="medline">29858148</pub-id>
          <pub-id pub-id-type="pii">S1473-3099(18)30231-7</pub-id>
          <pub-id pub-id-type="pmcid">PMC7185785</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>You</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Davies</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Protani</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>McIntyre</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Walker</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Scarlet fever epidemic in China caused by Streptococcus pyogenes serotype M12: epidemiologic and molecular analysis</article-title>
          <source>EBioMedicine</source>
          <year>2018</year>
          <month>02</month>
          <volume>28</volume>
          <fpage>128</fpage>
          <lpage>135</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2352-3964(18)30014-8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ebiom.2018.01.010</pub-id>
          <pub-id pub-id-type="medline">29342444</pub-id>
          <pub-id pub-id-type="pii">S2352-3964(18)30014-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC5835554</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Feng</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Jiao</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lao</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Ni</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Epidemiological features and forecast model analysis for the morbidity of influenza in Ningbo, China, 2006-2014</article-title>
          <source>Int J Environ Res Public Health</source>
          <year>2017</year>
          <month>05</month>
          <day>25</day>
          <volume>14</volume>
          <issue>6</issue>
          <fpage>559</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=ijerph14060559"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/ijerph14060559</pub-id>
          <pub-id pub-id-type="medline">28587073</pub-id>
          <pub-id pub-id-type="pii">ijerph14060559</pub-id>
          <pub-id pub-id-type="pmcid">PMC5486245</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Su</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Zhong</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Association between meteorological factors and mumps and models for prediction in Chongqing, China</article-title>
          <source>Int J Environ Res Public Health</source>
          <year>2022</year>
          <month>05</month>
          <day>29</day>
          <volume>19</volume>
          <issue>11</issue>
          <fpage>6625</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=ijerph19116625"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/ijerph19116625</pub-id>
          <pub-id pub-id-type="medline">35682208</pub-id>
          <pub-id pub-id-type="pii">ijerph19116625</pub-id>
          <pub-id pub-id-type="pmcid">PMC9180516</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>de Araújo Morais</surname>
              <given-names>LR</given-names>
            </name>
            <name name-style="western">
              <surname>da Silva Gomes</surname>
              <given-names>GS</given-names>
            </name>
          </person-group>
          <article-title>Forecasting daily Covid-19 cases in the world with a hybrid ARIMA and neural network model</article-title>
          <source>Appl Soft Comput</source>
          <year>2022</year>
          <month>09</month>
          <volume>126</volume>
          <fpage>109315</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35854916"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.asoc.2022.109315</pub-id>
          <pub-id pub-id-type="medline">35854916</pub-id>
          <pub-id pub-id-type="pii">S1568-4946(22)00493-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC9283122</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jing</surname>
              <given-names>QL</given-names>
            </name>
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Marshall</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>WB</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>ZC</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>JH</given-names>
            </name>
          </person-group>
          <article-title>Imported cases and minimum temperature drive dengue transmission in Guangzhou, China: evidence from ARIMAX model</article-title>
          <source>Epidemiol Infect</source>
          <year>2018</year>
          <month>07</month>
          <volume>146</volume>
          <issue>10</issue>
          <fpage>1226</fpage>
          <lpage>1235</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/29781412"/>
          </comment>
          <pub-id pub-id-type="doi">10.1017/S0950268818001176</pub-id>
          <pub-id pub-id-type="medline">29781412</pub-id>
          <pub-id pub-id-type="pii">S0950268818001176</pub-id>
          <pub-id pub-id-type="pmcid">PMC9134281</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Milinovich</surname>
              <given-names>GJ</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Jing</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Xia</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tong</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Using Baidu search index to predict dengue outbreak in China</article-title>
          <source>Sci Rep</source>
          <year>2016</year>
          <month>12</month>
          <day>01</day>
          <volume>6</volume>
          <fpage>38040</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/srep38040"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/srep38040</pub-id>
          <pub-id pub-id-type="medline">27905501</pub-id>
          <pub-id pub-id-type="pii">srep38040</pub-id>
          <pub-id pub-id-type="pmcid">PMC5131307</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tsao</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Basri</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Butt</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Digital disease surveillance for emerging infectious diseases: an early warning system using the internet and social media data for COVID-19 forecasting in Canada</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2023</year>
          <month>05</month>
          <day>18</day>
          <volume>302</volume>
          <fpage>861</fpage>
          <lpage>865</lpage>
          <pub-id pub-id-type="doi">10.3233/SHTI230290</pub-id>
          <pub-id pub-id-type="medline">37203518</pub-id>
          <pub-id pub-id-type="pii">SHTI230290</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Koplewitz</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Clemente</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Buckee</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Santillana</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Predicting dengue incidence leveraging internet-based data sources. A case study in 20 cities in Brazil</article-title>
          <source>PLoS Negl Trop Dis</source>
          <year>2022</year>
          <month>01</month>
          <volume>16</volume>
          <issue>1</issue>
          <fpage>e0010071</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pntd.0010071"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pntd.0010071</pub-id>
          <pub-id pub-id-type="medline">35073316</pub-id>
          <pub-id pub-id-type="pii">PNTD-D-20-02104</pub-id>
          <pub-id pub-id-type="pmcid">PMC8824328</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ginsberg</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Mohebbi</surname>
              <given-names>MH</given-names>
            </name>
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>RS</given-names>
            </name>
            <name name-style="western">
              <surname>Brammer</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Smolinski</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Brilliant</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Detecting influenza epidemics using search engine query data</article-title>
          <source>Nature</source>
          <year>2009</year>
          <month>02</month>
          <day>19</day>
          <volume>457</volume>
          <issue>7232</issue>
          <fpage>1012</fpage>
          <lpage>1014</lpage>
          <pub-id pub-id-type="doi">10.1038/nature07634</pub-id>
          <pub-id pub-id-type="medline">19020500</pub-id>
          <pub-id pub-id-type="pii">nature07634</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tu</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Jia</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Qian</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Using Baidu search values to monitor and predict the confirmed cases of COVID-19 in China: - evidence from Baidu index</article-title>
          <source>BMC Infect Dis</source>
          <year>2021</year>
          <month>01</month>
          <day>21</day>
          <volume>21</volume>
          <issue>1</issue>
          <fpage>98</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcinfectdis.biomedcentral.com/articles/10.1186/s12879-020-05740-x"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12879-020-05740-x</pub-id>
          <pub-id pub-id-type="medline">33478425</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12879-020-05740-x</pub-id>
          <pub-id pub-id-type="pmcid">PMC7819631</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Duan</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>MK</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zou</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Using Baidu search index to monitor and predict newly diagnosed cases of HIV/AIDS, syphilis and gonorrhea in China: estimates from a vector autoregressive (VAR) model</article-title>
          <source>BMJ Open</source>
          <year>2020</year>
          <month>03</month>
          <day>24</day>
          <volume>10</volume>
          <issue>3</issue>
          <fpage>e036098</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmjopen.bmj.com/lookup/pmidlookup?view=long&#38;pmid=32209633"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmjopen-2019-036098</pub-id>
          <pub-id pub-id-type="medline">32209633</pub-id>
          <pub-id pub-id-type="pii">bmjopen-2019-036098</pub-id>
          <pub-id pub-id-type="pmcid">PMC7202716</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="web">
          <source>National Health Commission of the People's Republic of China</source>
          <access-date>2023-04-20</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.nhc.gov.cn/">http://www.nhc.gov.cn/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="web">
          <source>Baidu search index</source>
          <access-date>2023-05-02</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://index.baidu.com/">https://index.baidu.com/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="web">
          <source>ChinaZ.com</source>
          <access-date>2023-04-26</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://data.chinaz.com/">https://data.chinaz.com/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="web">
          <source>Baidu index demand map</source>
          <access-date>2023-05-02</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://index.baidu.com/v2/main/index.html#/demand/">https://index.baidu.com/v2/main/index.html#/demand/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="web">
          <source>Baidu Encyclopedia</source>
          <access-date>2023-04-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://baike.baidu.com/">https://baike.baidu.com/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="web">
          <article-title>Health medical code</article-title>
          <source>Baidu</source>
          <access-date>2023-04-27</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://jiankang.baidu.com/widescreen/home">https://jiankang.baidu.com/widescreen/home</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yuan</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Nsoesie</surname>
              <given-names>EO</given-names>
            </name>
            <name name-style="western">
              <surname>Lv</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Chunara</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Brownstein</surname>
              <given-names>JS</given-names>
            </name>
          </person-group>
          <article-title>Monitoring influenza epidemics in China with search query from Baidu</article-title>
          <source>PLoS One</source>
          <year>2013</year>
          <volume>8</volume>
          <issue>5</issue>
          <fpage>e64323</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0064323"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0064323</pub-id>
          <pub-id pub-id-type="medline">23750192</pub-id>
          <pub-id pub-id-type="pii">PONE-D-13-00331</pub-id>
          <pub-id pub-id-type="pmcid">PMC3667820</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Zhong</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Rutherford</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Using Google Trends for influenza surveillance in South China</article-title>
          <source>PLoS One</source>
          <year>2013</year>
          <volume>8</volume>
          <issue>1</issue>
          <fpage>e55205</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0055205"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0055205</pub-id>
          <pub-id pub-id-type="medline">23372837</pub-id>
          <pub-id pub-id-type="pii">PONE-D-12-26520</pub-id>
          <pub-id pub-id-type="pmcid">PMC3555864</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hulth</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rydevik</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Linde</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Web queries as a source for syndromic surveillance</article-title>
          <source>PLoS One</source>
          <year>2009</year>
          <volume>4</volume>
          <issue>2</issue>
          <fpage>e4378</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0004378"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0004378</pub-id>
          <pub-id pub-id-type="medline">19197389</pub-id>
          <pub-id pub-id-type="pmcid">PMC2634970</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Xue</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>An</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Zhen</surname>
              <given-names>Q</given-names>
            </name>
          </person-group>
          <article-title>Search trends and prediction of human brucellosis using Baidu index data from 2011 to 2018 in China</article-title>
          <source>Sci Rep</source>
          <year>2020</year>
          <month>04</month>
          <day>03</day>
          <volume>10</volume>
          <issue>1</issue>
          <fpage>5896</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-020-62517-7"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-020-62517-7</pub-id>
          <pub-id pub-id-type="medline">32246053</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-020-62517-7</pub-id>
          <pub-id pub-id-type="pmcid">PMC7125199</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Lv</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Shao</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Xiao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Rutherford</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Early detection of an epidemic erythromelalgia outbreak using Baidu search data</article-title>
          <source>Sci Rep</source>
          <year>2015</year>
          <month>07</month>
          <day>28</day>
          <volume>5</volume>
          <fpage>12649</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/srep12649"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/srep12649</pub-id>
          <pub-id pub-id-type="medline">26218589</pub-id>
          <pub-id pub-id-type="pii">srep12649</pub-id>
          <pub-id pub-id-type="pmcid">PMC4517510</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Modeling the effects of air pollutants and meteorological factors on scarlet fever in five provinces, Northwest China, 2013-2018</article-title>
          <source>J Theor Biol</source>
          <year>2022</year>
          <month>07</month>
          <day>07</day>
          <volume>544</volume>
          <fpage>111134</fpage>
          <pub-id pub-id-type="doi">10.1016/j.jtbi.2022.111134</pub-id>
          <pub-id pub-id-type="medline">35469892</pub-id>
          <pub-id pub-id-type="pii">S0022-5193(22)00132-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lamagni</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Guy</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Chand</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Henderson</surname>
              <given-names>KL</given-names>
            </name>
            <name name-style="western">
              <surname>Chalker</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Lewis</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Saliba</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Elliot</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>GE</given-names>
            </name>
            <name name-style="western">
              <surname>Rushton</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sheridan</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Ramsay</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>AP</given-names>
            </name>
          </person-group>
          <article-title>Resurgence of scarlet fever in England, 2014-16: a population-based surveillance study</article-title>
          <source>Lancet Infect Dis</source>
          <year>2018</year>
          <month>02</month>
          <volume>18</volume>
          <issue>2</issue>
          <fpage>180</fpage>
          <lpage>187</lpage>
          <pub-id pub-id-type="doi">10.1016/S1473-3099(17)30693-X</pub-id>
          <pub-id pub-id-type="medline">29191628</pub-id>
          <pub-id pub-id-type="pii">S1473-3099(17)30693-X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Park</surname>
              <given-names>DW</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cho</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>HJ</given-names>
            </name>
            <name name-style="western">
              <surname>Jung</surname>
              <given-names>SH</given-names>
            </name>
            <name name-style="western">
              <surname>Seo</surname>
              <given-names>MH</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>YS</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>BH</given-names>
            </name>
            <name name-style="western">
              <surname>Min</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>SY</given-names>
            </name>
            <name name-style="western">
              <surname>Ha</surname>
              <given-names>DR</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>ES</given-names>
            </name>
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chung</surname>
              <given-names>JK</given-names>
            </name>
          </person-group>
          <article-title>Incidence and characteristics of scarlet fever, South Korea, 2008-2015</article-title>
          <source>Emerg Infect Dis</source>
          <year>2017</year>
          <month>04</month>
          <volume>23</volume>
          <issue>4</issue>
          <fpage>658</fpage>
          <lpage>661</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.3201/eid2304.160773"/>
          </comment>
          <pub-id pub-id-type="doi">10.3201/eid2304.160773</pub-id>
          <pub-id pub-id-type="medline">28322696</pub-id>
          <pub-id pub-id-type="pmcid">PMC5367408</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Liao</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Lv</surname>
              <given-names>Q</given-names>
            </name>
          </person-group>
          <article-title>Spatiotemporal dynamics and potential ecological drivers of acute respiratory infectious diseases: an example of scarlet fever in Sichuan Province</article-title>
          <source>BMC Public Health</source>
          <year>2022</year>
          <month>11</month>
          <day>21</day>
          <volume>22</volume>
          <issue>1</issue>
          <fpage>2139</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcpublichealth.biomedcentral.com/articles/10.1186/s12889-022-14469-y"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12889-022-14469-y</pub-id>
          <pub-id pub-id-type="medline">36411416</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12889-022-14469-y</pub-id>
          <pub-id pub-id-type="pmcid">PMC9680133</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Eysenbach</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Infodemiology: tracking flu-related searches on the web for syndromic surveillance</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2006</year>
          <volume>2006</volume>
          <fpage>244</fpage>
          <lpage>248</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/17238340"/>
          </comment>
          <pub-id pub-id-type="medline">17238340</pub-id>
          <pub-id pub-id-type="pii">86095</pub-id>
          <pub-id pub-id-type="pmcid">PMC1839505</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
