<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id><journal-id journal-id-type="publisher-id">jmir</journal-id><journal-id journal-id-type="index">1</journal-id><journal-title>Journal of Medical Internet Research</journal-title><abbrev-journal-title>J Med Internet Res</abbrev-journal-title><issn pub-type="epub">1438-8871</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v27i1e71786</article-id><article-id pub-id-type="doi">10.2196/71786</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>A Deep Learning Framework for Using Search Engine Data to Predict Influenza-Like Illness and Distinguish Epidemic and Nonepidemic Seasons: Multifeature Time Series Analysis</article-title></title-group><contrib-group><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Li</surname><given-names>Ji</given-names></name><degrees>MM</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Yan</surname><given-names>Xiangyu</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Chu</surname><given-names>Xingjie</given-names></name><degrees>BM</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Zhang</surname><given-names>Ying</given-names></name><degrees>MPH</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Liu</surname><given-names>Guoliang</given-names></name><degrees>BM</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Li</surname><given-names>Lin</given-names></name><degrees>MM</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Li</surname><given-names>Yue</given-names></name><degrees>MMed</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Dong</surname><given-names>Xiaochun</given-names></name><degrees>MM</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Mei</surname><given-names>Zihan</given-names></name><degrees>BS</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Liu</surname><given-names>Zhengkun</given-names></name><degrees>BEc</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Yuan</surname><given-names>Jinyue</given-names></name><degrees>BM</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Sun</surname><given-names>Xiaohan</given-names></name><degrees>BEng</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Cao</surname><given-names>Chunxia</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib></contrib-group><aff id="aff1"><institution>School of Disaster and Emergency Medicine, Tianjin University</institution><addr-line>No. 92 Weijin Road, Nankai District</addr-line><addr-line>Tianjin</addr-line><country>China</country></aff><aff id="aff2"><institution>College of Management and Economics, Tianjin University</institution><addr-line>Tianjin</addr-line><country>China</country></aff><aff id="aff3"><institution>Langfang Center for Disease Prevention and Control</institution><addr-line>Hebei</addr-line><country>China</country></aff><aff id="aff4"><institution>Tianjin Centers for Disease Control and Prevention</institution><addr-line>Tianjin</addr-line><country>China</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Mavragani</surname><given-names>Amaryllis</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Ibrahim</surname><given-names>Abdelhameed</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Ahmar</surname><given-names>Ansari Saleh</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Chunxia Cao, PhD, School of Disaster and Emergency Medicine, Tianjin University, No. 92 Weijin Road, Nankai District, Tianjin, 300072, China, 86 13512065620; <email>caochunxia@tju.edu.cn</email></corresp><fn fn-type="equal" id="equal-contrib1"><label>*</label><p>these authors contributed equally</p></fn></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>11</day><month>8</month><year>2025</year></pub-date><volume>27</volume><elocation-id>e71786</elocation-id><history><date date-type="received"><day>26</day><month>01</month><year>2025</year></date><date date-type="rev-recd"><day>25</day><month>06</month><year>2025</year></date><date date-type="accepted"><day>26</day><month>06</month><year>2025</year></date></history><copyright-statement>&#x00A9; Ji Li, Xiangyu Yan, Xingjie Chu, Ying Zhang, Guoliang Liu, Lin Li, Yue Li, Xiaochun Dong, Zihan Mei, Zhengkun Liu, Jinyue Yuan, Xiaohan Sun, Chunxia Cao. Originally published in the Journal of Medical Internet Research (<ext-link ext-link-type="uri" xlink:href="https://www.jmir.org">https://www.jmir.org</ext-link>), 11.8.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research (ISSN 1438-8871), is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://www.jmir.org/">https://www.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://www.jmir.org/2025/1/e71786"/><abstract><sec><title>Background</title><p>The seasonal influenza epidemic poses a persistent and severe threat to global public health. Web-based search data are recognized as a valuable source for forecasting influenza or other respiratory tract infection epidemics. Current influenza prediction studies typically focus on seasonal trends in traditional monitoring data, neglecting the sensitivity of different web-based search terms to seasonal changes, thereby increasing prediction challenges.</p></sec><sec><title>Objective</title><p>The aim of this study was to propose a deep learning framework for different influenza epidemic states based on Baidu index and percentage of influenza-like illness (ILI%).</p></sec><sec sec-type="methods"><title>Methods</title><p>Official weekly ILI% data from 2013 to 2024 were extracted from the Chinese National Notifiable Infectious Disease Reporting System (NIDRIS). Based on the Baidu index, influenza-related search indexes were acquired for the corresponding time periods. To explore the association between influenza-related search queries and ILI%, the study conducted a cross-correlation analysis. The study period was divided into influenza epidemic and nonepidemic period. The study finally used the convolutional long short-term memory (CLSTM) network framework to predict influenza epidemics with 1&#x2010;3 weeks ahead for the all-time period and epidemic + nonepidemic period. The evaluation metrics included model stability metric, accuracy metrics, and explanatory power metric.</p></sec><sec sec-type="results"><title>Results</title><p>The ILI% presented a regular seasonal high incidence in China. Meanwhile, the prediction of ILI% after dividing the epidemic and nonepidemic seasons (mean absolute percentage error [MAPE]=10.730%, mean square error [MSE]=0.884, mean absolute error [MAE]=0.649, root-mean-square error [RMSE]=0.940, and <italic>R</italic><sup>2</sup>=0.877) was better than that of the all-time period (MAPE=12.784%, MSE=1.513, MAE=0.744, RMSE=1.230, and <italic>R</italic><sup>2</sup>=0.786). In addition, we found that the ILI% + Baidu search index predicts better than only the ILI% regardless of the time period and lag time of the study. Comparative analysis with long short-term memory (LSTM) and transformer models demonstrated that CLSTM achieved superior performance in 1 week-ahead ILI% predictions using ILI% + Baidu index data in epidemic + nonepidemic period (MAPE=11.824%, MSE=1.243, MAE=0.723, RMSE=1.115, and <italic>R</italic><sup>2</sup>=0.827). Furthermore, CLSTM comprehensively surpasses LSTM in computational efficiency, complexity, extrapolation capability, and stability while partially outperforming transformer models.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>This study shows strong potential for influenza prediction by combining Baidu index data with traditional surveillance and specific keywords for epidemic and nonepidemic seasons. It provides a new perspective for public health preparedness. This research is expected to support early warning systems for influenza and other diseases. Future work will further optimize these models for more timely and accurate predictions, enhancing public health responses.</p></sec></abstract><kwd-group><kwd>influenza</kwd><kwd>CLSTM framework</kwd><kwd>Baidu index</kwd><kwd>influenza epidemic</kwd><kwd>nonepidemic seasons</kwd><kwd>convolutional long short-term memory</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Influenza poses a persistent and severe threat to global public health [<xref ref-type="bibr" rid="ref1">1</xref>]. The World Health Organization estimates that annual epidemics of influenza result in 1 billion infections, 3-5 million severe cases of influenza, and 300,000-650,000 deaths globally [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref3">3</xref>]. The National Health Commission of China reported that in 2020 and 2021, there were 1,145,278 and 668,246 influenza cases, with incidence rates of 81.5816 and 47.4008 per 100,000, respectively [<xref ref-type="bibr" rid="ref4">4</xref>]. China has a significant global share of patients with influenza, especially during the high influenza season. Influenza in China may significantly influence global influenza trends [<xref ref-type="bibr" rid="ref5">5</xref>]. China has a profound impact on global influenza due to its large population and its important role in global influenza surveillance, prediction, and early warning.</p><p>Currently, the main global influenza surveillance methods include monitoring influenza-like illness (ILI) and influenza virus positivity. These methods aim to capture fluctuations in patient visits and the intensity of influenza virus transmission. This provides insight into the onset, peak, and end of influenza [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>]. Traditional surveillance methods, such as weekly data reports, play an important role in influenza surveillance but often struggle with timely early warnings due to inherent delays. In contrast, the popularity of the web and advancements in data analysis have made search engine data highly useful for identifying infectious disease outbreaks in advance.</p><p>Google Flu Trends created a new era that used Google search data to predict the percentage of influenza-like illness (ILI%) in the United States [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref9">9</xref>]. Thereafter, multisource electronic data including web-based search data [<xref ref-type="bibr" rid="ref10">10</xref>-<xref ref-type="bibr" rid="ref12">12</xref>], influenza surveillance data [<xref ref-type="bibr" rid="ref10">10</xref>], influenza-related posts on Twitter [<xref ref-type="bibr" rid="ref13">13</xref>-<xref ref-type="bibr" rid="ref15">15</xref>], Wikipedia access logs [<xref ref-type="bibr" rid="ref16">16</xref>], and electronic health records [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref17">17</xref>] were integrated with mathematical models to track illness activities with very good predictive results. However, the model was not stable because the influenza trend exceeded the peak of the epidemic by more than 140% in 2013 in the United States and sparked a hot discussion about the limitation of search data in infectious disease research [<xref ref-type="bibr" rid="ref18">18</xref>]. Some studies had constructed models to improve forecasting accuracy in cities such as New York [<xref ref-type="bibr" rid="ref19">19</xref>], Melbourne [<xref ref-type="bibr" rid="ref20">20</xref>], and Hong Kong [<xref ref-type="bibr" rid="ref21">21</xref>]. The field of digital epidemiology is still in an early stage, but it has begun to be used to forecast infectious disease epidemic trends, especially during the COVID-19 pandemic [<xref ref-type="bibr" rid="ref22">22</xref>]. However, web-based search terms are vast and complex. Even within the same topic, time series correlations between search terms are weak. Current influenza prediction studies typically focus on seasonal trends in traditional monitoring data, neglecting the sensitivity of different web-based search terms to seasonal changes, thereby increasing prediction challenges.</p><p>Accordingly, this study proposed a deep learning framework for multifeature time series for different influenza epidemic states. The framework integrated Baidu index and traditional surveillance data to address the complex challenges of predicting influenza trends. In particular, the study divided the influenza epidemic states into epidemic and nonepidemic seasons. This adjustment not only allows the framework to better capture changes in influenza trends but also optimizes prediction accuracy. By integrating data from multiple sources, the framework can adjust its forecasting strategy across different influenza epidemic states.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Data Collection</title><p>The ILI% is the proportion of patients with ILI divided by the total number of physician visits. The ILI% based on weekly reports in Langfang, Hebei Province, China, was extracted from the Chinese National Notifiable Infectious Disease Reporting System (NIDRIS) for influenza from October 2013 to March 2024. Patients with ILI were defined as outpatients of any age with acute respiratory infection syndrome with fever &#x2265;38 &#x00B0;C and cough or sore throat.</p><p>Baidu index is a statistical indicator that represents the search volume of demanding keywords or phrases based on Baidu&#x2019;s search query logs, which is the largest search engine in China [<xref ref-type="bibr" rid="ref23">23</xref>]. This study summarized influenza-related keywords that might correlate with the trend of ILI% and selected the keywords and the time range from October 2013 to March 2024. The search data were based on personal computer and personal mobile phone data.</p></sec><sec id="s2-2"><title>Descriptive Analysis</title><p>A descriptive analysis was used to show the characteristics of the current ILI% and the current search indices of different keywords on the Baidu index. This study divided the study period based on the characteristics of influenza epidemics. According to the latest influenza surveillance plan [<xref ref-type="bibr" rid="ref24">24</xref>-<xref ref-type="bibr" rid="ref26">26</xref>], the epidemic season is from week 40 of each year to week 13 of the following year, while the nonepidemic season is from week 14 to week 39. This division helps align with the seasonal patterns of influenza outbreaks [<xref ref-type="bibr" rid="ref27">27</xref>]. The cross-correlation coefficient was calculated to explore the association between the influenza-related search terms data and the ILI% of the epidemic season and the nonepidemic season, respectively. The study also analyzed the correlation between the previous week&#x2019;s search index (from week 1 to 4) and the ILI% of the epidemic season and the nonepidemic season. A correlation coefficient closer to 1 or &#x2013;1 indicates a stronger correlation, and a correlation coefficient closer to 0 indicates a weaker correlation. The cross-correlation coefficient was calculated between each variable to observe the correlations among the variables. After performing the correlation analysis, the variables with correlation coefficients above 0.5 were selected. These variables were used in different lags to develop predicting models. This approach aimed to improve prediction accuracy based on previous studies [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref28">28</xref>].</p></sec><sec id="s2-3"><title>Deep Learning Framework for Multifeature Time Series</title><p>To effectively leverage the useful information in surveillance data and Baidu index data, this study proposed a deep learning framework for multifeature time series to address the challenge of predicting real-world influenza trends (<xref ref-type="fig" rid="figure1">Figure 1</xref>). By fully mining the inherent characteristics of data and establishing the mapping relationship between features and results, the framework could complete the task of time series prediction in a scientific and robust manner. The mathematical formulation of the framework is shown in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>CLSTM network framework. CLSTM: convolutional long short-term memory; GAF: gated attention fusion; ILI%: percentage of influenza-like illness; LSTM: long short-term memory; MLP: multiple-layer perceptron; VMD: variational mode decomposition.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v27i1e71786_fig01.png"/></fig><p>The models used in this study were based on an encoder-decoder framework. The input of the encoder was the data, including historical ILI% and Baidu keyword searches. The advanced ILI% forecast results were obtained from the output of the decoder. For observed ILI%, the variational mode decomposition algorithm [<xref ref-type="bibr" rid="ref29">29</xref>] was applied to decompose original signal into multiple intrinsic mode functions. This helped remove redundant information from the observed ILI%, thereby improving prediction accuracy [<xref ref-type="bibr" rid="ref30">30</xref>]. A time window was set and slid during each decomposition to generate new subsignals while preventing information leakage. For the Baidu index, transformer was used for the feature extraction in this study. The method used a self-attentive mechanism to capture temporal dependencies and semantic relationships in the sequences. This allowed it to extract key features that are useful for predicting ILI%. In this way, feature extraction could more accurately reflect the link between search data and influenza activity.</p><p>This study used the classical encoder-decoder framework for algorithm construction. The encoder part was divided into backbone and fusion parts. Data from different modalities were input into the encoder through 2 separate channels. The backbone part, which is a convolutional long short-term memory (CLSTM) network, was used to learn the corresponding features of each modality {M<sub>1</sub>, M<sub>2</sub>}. Gated attention fusion model was used in the fusion part. Gated attention fusion integrated features {M<sub>1</sub>, M<sub>2</sub>} from the backbone. It generated a query, key, and value using the attention mechanism and computes attention weights. Then, these weights were processed by softmax, used to weight the value. Subsequently, the weighted values were used to enable the model to selectively focus on key features through the gating mechanism, resulting in the joint feature, M<sub>y</sub>. The joint feature M<sub>y</sub> was used as input data and sent into the decoder. In the decoder, the CLSTM module was used to decode the state vector, while the multiple-layer perceptron transformed the features generated by the CLSTM into the final ILI% prediction. In the model validation, the study introduced long short-term memory (LSTM) and transformer as baseline comparators, ensuring fair evaluation through identical training sets and assessment metrics. To further verify generalizability, the model was validated using independent datasets from Tianjin, China.</p></sec><sec id="s2-4"><title>Statistical Analysis</title><p>The ILI% surveillance data were divided into 2 parts, the training set and the test set. The training set was from the 14th week of 2013 to the 10th week of 2022, and the test set was from the 11th week of 2022 to the 13th week of 2024 for the whole study period. The training and test sets for the epidemic and nonepidemic seasons were divided according to their respective study times in a ratio of 8:2 and assigned in time order. This study used 3 types of indicators to evaluate the performance of the prediction model, including model stability metric, accuracy metrics, and explanatory power metric (<xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>). Stability metric mainly uses the mean absolute percentage error (MAPE). Accuracy metrics include mean square error (MSE), root-mean-square error (RMSE), and mean absolute error (MAE). Explanatory power metric mainly uses the coefficient of determination (<italic>R</italic><sup>2</sup>). When <italic>R</italic><sup>2</sup> exceeds 0.7, while MSE, RMSE, and MAE values approach 0 and MAPE falls below 20%, it indicates strong predictive performance of the model [<xref ref-type="bibr" rid="ref31">31</xref>]. In addition to model performance, the models&#x2019; computational efficiency and computational complexity analysis were used to the models&#x2019; comparison. To evaluate computational efficiency, floating-point operations per second (FLOPs) can be used because it directly reflects the amount of computational resources and processing speed required by the model when performing computational tasks. Similarly, parameters indicate the model&#x2019;s complexity and memory footprint, which are crucial for practical deployment. To evaluate computational complexity analysis, the Big-O complexity estimates were used to assess scalability. Moreover, hyperparameter sensitivity analysis was conducted to investigate how variations in model parameters (the number of attention heads, the kernel size, and the number of layers) affect predictive performance. Shapley Additive Explanations (SHAP) analysis was used to interpret feature contributions in the CLSTM model. Finally, the convergence analysis was used to demonstrate training stability through comparative learning curves across multiple influenza seasons.</p><p>A box plot was introduced to illustrate the distribution of prediction errors. All data analyses were performed using SPSS Statistics software (version 23; IBM Corporation) and Python (version 3.4.0; Python Software Foundation). All data were checked for completeness and accuracy before analysis.</p></sec><sec id="s2-5"><title>Ethical Considerations</title><p>The study used deidentified surveillance data from the Chinese NIDRIS in China. The study received formal ethics approval from the research ethics board of Tianjin University (approval number TJUE-2025-222), and the requirement for informed consent was waived. The study did not involve direct human participants research, and no compensation was provided to participants.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>ILI% Trend From 2013 to 2024</title><p>The ILI% presented a regular seasonal high incidence in China. The average weekly ILI% was 4.36%, respectively. The highest ILI% was in the 50th week in 2022 (21.03%) and the lowest was in the 40th week in 2016 (0.86%). The influenza season is clearly reflected in the period from October to March each year, and there is only 1 influenza peak in the whole influenza cycle (<xref ref-type="fig" rid="figure2">Figure 2</xref>). ILI% has a trend of increasing annually (<xref ref-type="fig" rid="figure3">Figure 3</xref>). The observed ILI% showed a clear periodic pattern, with the ILI% being higher than the yearly average for the period from October to March (<xref ref-type="fig" rid="figure3">Figure 3</xref>).</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>ILI% trend from 2013 to 2024. ILI%: percentage of influenza-like illness.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v27i1e71786_fig02.png"/></fig><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>The seasonal and trend decomposition of the percentage influenza-like illness by week from 2013 to 2024.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v27i1e71786_fig03.png"/></fig></sec><sec id="s3-2"><title>Correlation Analysis Between Baidu Index and ILI%</title><p>Based on the literature searched on the web, the Baidu search terms in this study that were screened out were all related to influenza. Overall, the study observed a high correlation between the Baidu search terms and the ILI% in all databases. The terms were classified into 4 categories: influenza essential facts, influenza symptoms, influenza treatment, and influenza prevention (<xref ref-type="table" rid="table1">Table 1</xref> and <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>). The correlation coefficients differed between the influenza epidemic and nonepidemic seasons.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Correlations between Baidu index and percentage of influenza-like illness in epidemic and nonepidemic seasons at different lags.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Category and terms in Chinese</td><td align="left" valign="bottom">Terms in English</td><td align="left" valign="bottom" colspan="3">Cross-correlation coefficient of epidemic season</td><td align="left" valign="bottom" colspan="3">Cross-correlation coefficient of nonepidemic season</td></tr><tr><td align="left" valign="bottom"/><td align="left" valign="bottom"/><td align="left" valign="bottom">Lag 1</td><td align="left" valign="bottom">Lag 2</td><td align="left" valign="bottom">Lag 3</td><td align="left" valign="bottom">Lag 1</td><td align="left" valign="bottom">Lag 2</td><td align="left" valign="bottom">Lag 3</td></tr></thead><tbody><tr><td align="left" valign="top">Influenza essential facts</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x6D41;&#x884C;&#x6027;&#x611F;&#x5192;</td><td align="left" valign="top">Influenza</td><td align="left" valign="top">0.692</td><td align="left" valign="top">0.628</td><td align="left" valign="top">0.525</td><td align="left" valign="top">0.421</td><td align="left" valign="top">0.406</td><td align="left" valign="top">0.389</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x5B63;&#x8282;&#x6027;&#x6D41;&#x611F;</td><td align="left" valign="top">Seasonal influenza</td><td align="left" valign="top">0.587</td><td align="left" valign="top">0.485</td><td align="left" valign="top">0.399</td><td align="left" valign="top">0.364</td><td align="left" valign="top">0.342</td><td align="left" valign="top">0.320</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x6D41;&#x611F;&#x4F20;&#x64AD;&#x9014;&#x5F84;</td><td align="left" valign="top">Influenza transmission route</td><td align="left" valign="top">0.631</td><td align="left" valign="top">0.642</td><td align="left" valign="top">0.589</td><td align="left" valign="top">0.201</td><td align="left" valign="top">0.213</td><td align="left" valign="top">0.279</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x6D41;&#x611F;&#x75C5;&#x6BD2;</td><td align="left" valign="top">Influenza virus</td><td align="left" valign="top">0.596</td><td align="left" valign="top">0.531</td><td align="left" valign="top">0.423</td><td align="left" valign="top">0.320</td><td align="left" valign="top">0.320</td><td align="left" valign="top">0.318</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x6D41;&#x611F;&#x5E76;&#x53D1;&#x75C7;</td><td align="left" valign="top">Influenza complications</td><td align="left" valign="top">0.546</td><td align="left" valign="top">0.455</td><td align="left" valign="top">0.321</td><td align="left" valign="top">0.484</td><td align="left" valign="top">0.482</td><td align="left" valign="top">0.484</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x6D41;&#x611F;&#x6D41;&#x884C;</td><td align="left" valign="top">Influenza epidemic</td><td align="left" valign="top">0.541</td><td align="left" valign="top">0.518</td><td align="left" valign="top">0.475</td><td align="left" valign="top">0.203</td><td align="left" valign="top">0.197</td><td align="left" valign="top">0.200</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x4E0A;&#x547C;&#x5438;&#x9053;&#x611F;&#x67D3;</td><td align="left" valign="top">Upper respiratory tract infection</td><td align="left" valign="top">0.705</td><td align="left" valign="top">0.620</td><td align="left" valign="top">0.499</td><td align="left" valign="top">0.659</td><td align="left" valign="top">0.641</td><td align="left" valign="top">0.626</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x5C0F;&#x513F;&#x611F;&#x5192;</td><td align="left" valign="top">Common cold in children</td><td align="left" valign="top">0.493</td><td align="left" valign="top">0.539</td><td align="left" valign="top">0.564</td><td align="left" valign="top">0.702</td><td align="left" valign="top">0.704</td><td align="left" valign="top">0.686</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x6C14;&#x7BA1;&#x708E;</td><td align="left" valign="top">Tracheitis</td><td align="left" valign="top">0.011</td><td align="left" valign="top">0.014</td><td align="left" valign="top">0.071</td><td align="left" valign="top">0.519</td><td align="left" valign="top">0.521</td><td align="left" valign="top">0.530</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x6D41;&#x611F;&#x55DC;&#x8840;&#x6746;&#x83CC;</td><td align="left" valign="top"><italic>Haemophilus influenzae</italic></td><td align="left" valign="top">0.344</td><td align="left" valign="top">0.371</td><td align="left" valign="top">0.380</td><td align="left" valign="top">0.650</td><td align="left" valign="top">0.658</td><td align="left" valign="top">0.667</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x6D41;&#x611F;&#x6297;&#x539F;</td><td align="left" valign="top">Influenza antigen</td><td align="left" valign="top">0.315</td><td align="left" valign="top">0.123</td><td align="left" valign="top">0.025</td><td align="left" valign="top">0.531</td><td align="left" valign="top">0.503</td><td align="left" valign="top">0.479</td></tr><tr><td align="left" valign="top">Influenza symptoms</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x5934;&#x75DB;</td><td align="left" valign="top">Headache</td><td align="left" valign="top">0.181</td><td align="left" valign="top">0.262</td><td align="left" valign="top">0.347</td><td align="left" valign="top">0.551</td><td align="left" valign="top">0.544</td><td align="left" valign="top">0.535</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x54BD;&#x75DB;</td><td align="left" valign="top">Sore throat</td><td align="left" valign="top">0.620</td><td align="left" valign="top">0.468</td><td align="left" valign="top">0.323</td><td align="left" valign="top">0.580</td><td align="left" valign="top">0.536</td><td align="left" valign="top">0.510</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x53D1;&#x70E7;</td><td align="left" valign="top">Fever</td><td align="left" valign="top">0.365</td><td align="left" valign="top">0.378</td><td align="left" valign="top">0.388</td><td align="left" valign="top">0.601</td><td align="left" valign="top">0.596</td><td align="left" valign="top">0.591</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x55DC;&#x7761;</td><td align="left" valign="top">Drowsiness</td><td align="left" valign="top">0.486</td><td align="left" valign="top">0.468</td><td align="left" valign="top">0.411</td><td align="left" valign="top">0.608</td><td align="left" valign="top">0.597</td><td align="left" valign="top">0.590</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x54B3;&#x55FD;</td><td align="left" valign="top">Cough</td><td align="left" valign="top">0.514</td><td align="left" valign="top">0.436</td><td align="left" valign="top">0.260</td><td align="left" valign="top">0.036</td><td align="left" valign="top">0.075</td><td align="left" valign="top">0.106</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x6253;&#x55B7;&#x568F;</td><td align="left" valign="top">Sneeze</td><td align="left" valign="top">0.052</td><td align="left" valign="top">0.109</td><td align="left" valign="top">0.196</td><td align="left" valign="top">0.662</td><td align="left" valign="top">0.667</td><td align="left" valign="top">0.681</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x6D41;&#x9F3B;&#x6D95;</td><td align="left" valign="top">Runny nose</td><td align="left" valign="top">0.442</td><td align="left" valign="top">0.453</td><td align="left" valign="top">0.463</td><td align="left" valign="top">0.618</td><td align="left" valign="top">0.615</td><td align="left" valign="top">0.611</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x6D41;&#x611F;&#x75C7;&#x72B6;</td><td align="left" valign="top">Influenza symptom</td><td align="left" valign="top">0.406</td><td align="left" valign="top">0.371</td><td align="left" valign="top">0.311</td><td align="left" valign="top">0.654</td><td align="left" valign="top">0.644</td><td align="left" valign="top">0.622</td></tr><tr><td align="left" valign="top">Influenza treatment</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x611F;&#x5EB7;</td><td align="left" valign="top">Compound paracetamol and amantadine hydrochloride tablets</td><td align="left" valign="top">0.468</td><td align="left" valign="top">0.281</td><td align="left" valign="top">0.142</td><td align="left" valign="top">0.558</td><td align="left" valign="top">0.507</td><td align="left" valign="top">0.464</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x611F;&#x5192;&#x6E05;&#x70ED;&#x9897;&#x7C92;</td><td align="left" valign="top">Ganmao Qingre Keli</td><td align="left" valign="top">0.466</td><td align="left" valign="top">0.292</td><td align="left" valign="top">0.136</td><td align="left" valign="top">0.550</td><td align="left" valign="top">0.503</td><td align="left" valign="top">0.464</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x9000;&#x70E7;&#x836F;</td><td align="left" valign="top">Antipyretics</td><td align="left" valign="top">0.554</td><td align="left" valign="top">0.433</td><td align="left" valign="top">0.355</td><td align="left" valign="top">0.546</td><td align="left" valign="top">0.491</td><td align="left" valign="top">0.447</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x8FDE;&#x82B1;&#x6E05;&#x761F;</td><td align="left" valign="top">Lianhua Qingwen capsule</td><td align="left" valign="top">0.299</td><td align="left" valign="top">0.155</td><td align="left" valign="top">0.065</td><td align="left" valign="top">0.501</td><td align="left" valign="top">0.487</td><td align="left" valign="top">0.475</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x6297;&#x751F;&#x7D20;</td><td align="left" valign="top">Antibiotic</td><td align="left" valign="top">0.082</td><td align="left" valign="top">0.142</td><td align="left" valign="top">0.201</td><td align="left" valign="top">0.539</td><td align="left" valign="top">0.546</td><td align="left" valign="top">0.532</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x5EB7;&#x6CF0;&#x514B;</td><td align="left" valign="top">Compound pseudoephedrine HCl<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup>-sustained release capsules</td><td align="left" valign="top">0.161</td><td align="left" valign="top">0.030</td><td align="left" valign="top">0.154</td><td align="left" valign="top">0.497</td><td align="left" valign="top">0.537</td><td align="left" valign="top">0.561</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x6E05;&#x5F00;&#x7075;&#x9897;&#x7C92;</td><td align="left" valign="top">Qingkailingkeli</td><td align="left" valign="top">0.210</td><td align="left" valign="top">0.046</td><td align="left" valign="top">0.085</td><td align="left" valign="top">0.484</td><td align="left" valign="top">0.502</td><td align="left" valign="top">0.517</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x963F;&#x83AB;&#x897F;&#x6797;</td><td align="left" valign="top">Amoxicillin</td><td align="left" valign="top">0.669</td><td align="left" valign="top">0.565</td><td align="left" valign="top">0.425</td><td align="left" valign="top">0.656</td><td align="left" valign="top">0.634</td><td align="left" valign="top">0.607</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x5965;&#x53F8;&#x4ED6;&#x97E6;&#x9897;&#x7C92;</td><td align="left" valign="top">Oseltamivir phosphate capsules</td><td align="left" valign="top">0.517</td><td align="left" valign="top">0.496</td><td align="left" valign="top">0.441</td><td align="left" valign="top">0.239</td><td align="left" valign="top">0.394</td><td align="left" valign="top">0.553</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x6297;&#x75C5;&#x6BD2;&#x53E3;&#x670D;&#x6DB2;</td><td align="left" valign="top">Kangbingdukoufuye</td><td align="left" valign="top">0.528</td><td align="left" valign="top">0.338</td><td align="left" valign="top">0.203</td><td align="left" valign="top">0.413</td><td align="left" valign="top">0.354</td><td align="left" valign="top">0.302</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x6D41;&#x611F;&#x4E38;</td><td align="left" valign="top">Liuganwan</td><td align="left" valign="top">0.535</td><td align="left" valign="top">0.387</td><td align="left" valign="top">0.267</td><td align="left" valign="top">0.224</td><td align="left" valign="top">0.199</td><td align="left" valign="top">0.145</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x83CA;&#x82B1;&#x8336;</td><td align="left" valign="top">Chrysanthemum tea</td><td align="left" valign="top">0.404</td><td align="left" valign="top">0.412</td><td align="left" valign="top">0.400</td><td align="left" valign="top">0.566</td><td align="left" valign="top">0.575</td><td align="left" valign="top">0.582</td></tr><tr><td align="left" valign="top">Influenza prevention</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x6D41;&#x611F;&#x75AB;&#x82D7;&#x63A5;&#x79CD;</td><td align="left" valign="top">Influenza vaccine vaccination</td><td align="left" valign="top">0.275</td><td align="left" valign="top">0.241</td><td align="left" valign="top">0.231</td><td align="left" valign="top">0.675</td><td align="left" valign="top">0.672</td><td align="left" valign="top">0.674</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x6D41;&#x611F;&#x9632;&#x63A7;</td><td align="left" valign="top">Influenza prevention and control</td><td align="left" valign="top">0.473</td><td align="left" valign="top">0.429</td><td align="left" valign="top">0.387</td><td align="left" valign="top">0.628</td><td align="left" valign="top">0.624</td><td align="left" valign="top">0.614</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x59DC;&#x7CD6;&#x6C34;</td><td align="left" valign="top">Ginger syrup</td><td align="left" valign="top">0.053</td><td align="left" valign="top">0.098</td><td align="left" valign="top">0.244</td><td align="left" valign="top">0.543</td><td align="left" valign="top">0.557</td><td align="left" valign="top">0.566</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>HCI: hydrogen chloride.</p></fn></table-wrap-foot></table-wrap><p>When analyzing the use of keywords in different time periods, it was found that the focus on keyword categories differed between the influenza epidemic and nonepidemic seasons (<xref ref-type="table" rid="table1">Table 1</xref> and <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>). Specifically, in the influenza epidemic season, the significant keywords with a cross-correlation coefficient greater than 0.5 mainly concentrated on the category of influenza essential facts. These keywords usually focused on basic information about influenza-related diseases, transmission routes, and other basic information. In contrast, during the nonepidemic season, the most important keywords in the framework mainly focused on the category of influenza treatment. It covered the use of medications, treatment protocols, and other content. This suggests that there are remarkable differences in the public&#x2019;s concerns during different time periods. In addition, this study observed that the categories of keywords throughout the year mostly overlapped with those used during the epidemic season.</p></sec><sec id="s3-3"><title>CLSTM Performance for Prediction</title><sec id="s3-3-1"><title>Testing the Prediction Results for Different Times in Advance and Various Study Periods</title><p>This study used CLSTM for ILI% prediction, with hyperparameter settings detailed in <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>. First, the original ILI% was solely input into the framework as the common standard for predicting the ILI% trend. Second, the ILI % was simultaneously input into the framework with a Baidu index with a correlation coefficient above 0.5. The study conducted experiments on 4 different study periods (all-time period, epidemic + nonepidemic period, epidemic period, and nonepidemic period) by adding only ILI% for prediction and ILI% + Baidu index.</p><p>It was found that the prediction of ILI% after dividing the epidemic and nonepidemic seasons was better than that of the all-time period (<xref ref-type="fig" rid="figure4">Figure 4</xref> and <xref ref-type="table" rid="table2">Table 2</xref>). In particular, the effects of 1-week and 2-week lag predictions were more stable (lag 1 of ILI% in period 2: MAPE=10.730%, MSE=0.884, MAE=0.649, RMSE=0.940, and <italic>R</italic><sup>2</sup>=0.877; lag 1 of ILI% + Baidu index in period 2: MAPE=11.824%, MSE=1.243, MAE=0.723, RMSE=1.115, and <italic>R</italic><sup>2</sup>=0.827). On the prediction effect of ILI% 3-week lag, using only ILI% is better than ILI% + Baidu index (lag 3 of ILI% in period 2: MAPE=18.458%, MSE=2.623, MAE=1.053, RMSE=1.620, and <italic>R</italic><sup>2</sup>=0.635; lag 3 of ILI% + Baidu index in period 2: MAPE=18.260%, MSE=1.996, MAE=1.014, RMSE=1.413, and <italic>R</italic><sup>2</sup>=0.722; <xref ref-type="table" rid="table2">Table 2</xref>). In addition, it was found that the ILI% + Baidu index predicts better than only the ILI% regardless of the time period and lag time of the study (<xref ref-type="fig" rid="figure5">Figure 5</xref> and <xref ref-type="table" rid="table2">Table 2</xref>). The conclusions were general in nature and demonstrated stable model performance.</p><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>The prediction results for different times in advance and various study periods for all-time period and epidemic + nonepidemic period. There are 3 columns on the graph, lag 1, lag 2, and lag 3, which represent the lag of the dependent variable (<bold><italic>Y</italic></bold>) relative to the independent variable (<bold><italic>X</italic></bold>) of order 1, 2, and 3. There are 2 rows on the graph; the first one is only ILI%, which indicates that only the ILI% indicator is involved in all the inputs and outputs of this framework variable. The second row is ILI% + Baidu, which indicates that the inputs and outputs of this framework variable have both the Baidu index and ILI% involved. The figure was conducted over 2 research periods. First, all-time period (the 11th week of 2022 to the 13th week of 2024). It is an initial time period without a division between epidemic and nonepidemic seasons. Second, epidemic + nonepidemic period (the 11th week of 2022 to the 13th week of 2024). This is represented by dividing the seasons, predicting the results using the respective data, and combining the predictions into a final time period. The 3 lines in the figure represent the predicted values of ILI% for the true value, all-time period, and epidemic + nonepidemic period, respectively. ILI%: percentage of influenza-like illness.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v27i1e71786_fig04.png"/></fig><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Prediction effects for different study periods and for different combinations of inputs<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup>.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom"/><td align="left" valign="bottom" colspan="5">ILI%<sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup></td><td align="left" valign="bottom" colspan="5">ILI% + Baidu index</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">MAPE (%)<sup><xref ref-type="table-fn" rid="table2fn3">c</xref></sup></td><td align="left" valign="top">MSE<sup><xref ref-type="table-fn" rid="table2fn4">d</xref></sup></td><td align="left" valign="top">MAE<sup><xref ref-type="table-fn" rid="table2fn5">e</xref></sup></td><td align="left" valign="top">RMSE<sup><xref ref-type="table-fn" rid="table2fn6">f</xref></sup></td><td align="left" valign="top"><italic>R</italic><sup>2</sup></td><td align="left" valign="top">MAPE (%)</td><td align="left" valign="top">MSE</td><td align="left" valign="top">MAE</td><td align="left" valign="top">RMSE</td><td align="left" valign="top"><italic>R</italic><sup>2</sup></td></tr></thead><tbody><tr><td align="left" valign="top" colspan="11">Period 1: all-time</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Lag 1</td><td align="left" valign="top">12.784</td><td align="left" valign="top">1.513</td><td align="left" valign="top">0.744</td><td align="left" valign="top">1.230</td><td align="left" valign="top">0.786</td><td align="left" valign="top">13.464</td><td align="left" valign="top">1.377</td><td align="left" valign="top">0.762</td><td align="left" valign="top">1.173</td><td align="left" valign="top">0.806</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Lag 2</td><td align="left" valign="top">15.913</td><td align="left" valign="top">1.800</td><td align="left" valign="top">0.924</td><td align="left" valign="top">1.342</td><td align="left" valign="top">0.746</td><td align="left" valign="top">15.737</td><td align="left" valign="top">1.718</td><td align="left" valign="top">0.917</td><td align="left" valign="top">1.311</td><td align="left" valign="top">0.758</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Lag 3</td><td align="left" valign="top">15.287</td><td align="left" valign="top">1.815</td><td align="left" valign="top">0.881</td><td align="left" valign="top">1.347</td><td align="left" valign="top">0.744</td><td align="left" valign="top">17.544</td><td align="left" valign="top">1.934</td><td align="left" valign="top">0.978</td><td align="left" valign="top">1.391</td><td align="left" valign="top">0.727</td></tr><tr><td align="left" valign="top" colspan="11">Period 2: epidemic + nonepidemic</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Lag 1</td><td align="left" valign="top">10.730</td><td align="left" valign="top">0.884</td><td align="left" valign="top">0.649</td><td align="left" valign="top">0.940</td><td align="left" valign="top">0.877</td><td align="left" valign="top">11.824</td><td align="left" valign="top">1.243</td><td align="left" valign="top">0.723</td><td align="left" valign="top">1.115</td><td align="left" valign="top">0.827</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Lag 2</td><td align="left" valign="top">13.257</td><td align="left" valign="top">1.681</td><td align="left" valign="top">0.858</td><td align="left" valign="top">1.297</td><td align="left" valign="top">0.766</td><td align="left" valign="top">13.235</td><td align="left" valign="top">1.522</td><td align="left" valign="top">0.816</td><td align="left" valign="top">1.234</td><td align="left" valign="top">0.788</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Lag 3</td><td align="left" valign="top">18.458</td><td align="left" valign="top">2.623</td><td align="left" valign="top">1.053</td><td align="left" valign="top">1.620</td><td align="left" valign="top">0.635</td><td align="left" valign="top">18.260</td><td align="left" valign="top">1.996</td><td align="left" valign="top">1.014</td><td align="left" valign="top">1.413</td><td align="left" valign="top">0.722</td></tr><tr><td align="left" valign="top" colspan="11">Period 3: epidemic</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Lag 1</td><td align="left" valign="top">12.089</td><td align="left" valign="top">2.001</td><td align="left" valign="top">0.831</td><td align="left" valign="top">1.415</td><td align="left" valign="top">0.818</td><td align="left" valign="top">11.966</td><td align="left" valign="top">1.603</td><td align="left" valign="top">0.782</td><td align="left" valign="top">1.266</td><td align="left" valign="top">0.854</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Lag 2</td><td align="left" valign="top">14.436</td><td align="left" valign="top">2.189</td><td align="left" valign="top">0.955</td><td align="left" valign="top">1.480</td><td align="left" valign="top">0.801</td><td align="left" valign="top">14.707</td><td align="left" valign="top">1.864</td><td align="left" valign="top">0.934</td><td align="left" valign="top">1.365</td><td align="left" valign="top">0.831</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Lag 3</td><td align="left" valign="top">20.637</td><td align="left" valign="top">3.286</td><td align="left" valign="top">1.203</td><td align="left" valign="top">1.813</td><td align="left" valign="top">0.702</td><td align="left" valign="top">22.368</td><td align="left" valign="top">2.865</td><td align="left" valign="top">1.232</td><td align="left" valign="top">1.693</td><td align="left" valign="top">0.740</td></tr><tr><td align="left" valign="top" colspan="11">Period 4: nonepidemic</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Lag 1</td><td align="left" valign="top">9.218</td><td align="left" valign="top">0.478</td><td align="left" valign="top">0.548</td><td align="left" valign="top">0.691</td><td align="left" valign="top">0.813</td><td align="left" valign="top">8.480</td><td align="left" valign="top">0.378</td><td align="left" valign="top">0.479</td><td align="left" valign="top">0.615</td><td align="left" valign="top">0.852</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Lag 2</td><td align="left" valign="top">10.189</td><td align="left" valign="top">0.607</td><td align="left" valign="top">0.612</td><td align="left" valign="top">0.779</td><td align="left" valign="top">0.763</td><td align="left" valign="top">9.753</td><td align="left" valign="top">0.574</td><td align="left" valign="top">0.555</td><td align="left" valign="top">0.758</td><td align="left" valign="top">0.775</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Lag 3</td><td align="left" valign="top">10.863</td><td align="left" valign="top">0.733</td><td align="left" valign="top">0.638</td><td align="left" valign="top">0.856</td><td align="left" valign="top">0.713</td><td align="left" valign="top">11.634</td><td align="left" valign="top">0.715</td><td align="left" valign="top">0.670</td><td align="left" valign="top">0.846</td><td align="left" valign="top">0.720</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>The study was conducted over 4 research periods. Period 1: all-time period (the 11th week of 2022 to the 13th week of 2024). It is an initial time period without a division between epidemic and nonepidemic seasons. Period 2: epidemic + nonepidemic period (the 11th week of 2022 to the 13th week of 2024). This is represented by dividing the seasons, predicting the results using the respective data, and combining the predictions into a final time period. Period 3: epidemic period (the 11th week of 2022 to the 13th week of 2022, the 40th week of 2022 to the 13th week of 2023, and the 40th week of 2023 to the 13th week of 2024). It indicates the time period of the epidemic season. Period 4: nonepidemic period (the 14th week of 2022 to the 39th week of 2022, and the 14th week of 2023 to the 39th week of 2023). It indicates the time period of the nonepidemic season.</p></fn><fn id="table2fn2"><p><sup>b</sup>ILI%: percentage of influenza-like illness.</p></fn><fn id="table2fn3"><p><sup>c</sup>MAPE: mean absolute percentage error.</p></fn><fn id="table2fn4"><p><sup>d</sup>MSE: mean square error.</p></fn><fn id="table2fn5"><p><sup>e</sup>MAE: mean absolute error.</p></fn><fn id="table2fn6"><p><sup>f</sup>RMSE: root-mean-square error.</p></fn></table-wrap-foot></table-wrap><fig position="float" id="figure5"><label>Figure 5.</label><caption><p>The prediction results for different times in advance and various study periods for only ILI% and ILI% + Baidu. There are 3 columns on the graph, lag 1, lag 2, and lag 3, which represent the lag of the dependent variable (<bold><italic>Y</italic></bold>) relative to the independent variable (<bold><italic>X</italic></bold>) of order 1, 2, and 3. The figure was conducted over 3 research periods. First, all-time period (the 11th week of 2022 to the 13th week of 2024). It is an initial time period without a division between epidemic and nonepidemic seasons. Second, epidemic season (the 11th week of 2022 to the 13th week of 2022, the 40th week of 2022 to the 13th week of 2023, and the 40th week of 2023 to the 13th week of 2024). It indicates the time period of the epidemic season. Third, nonepidemic season (the 14th week of 2022 to the 39th week of 2022, the 14th week of 2023 to the 39th week of 2023). It indicates the time period of the nonepidemic season. There are 3 rows on the chart, each representing 3 time periods. The 3 lines on each graph are the predicted values of ILI% at the true value, the case where only ILI% is the variable, and the case where ILI% + Baidu is the variable, respectively. ILI%: percentage of influenza-like illness.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v27i1e71786_fig05.png"/></fig><p>CLSTM demonstrates robust reliability for 1-week-ahead ILI% predictions using ILI% + Baidu index data in 4 periods (all-time, epidemic + nonepidemic, epidemic, and nonepidemic periods). The overall prediction errors exhibit a median near zero with reasonable distribution ranges (<xref ref-type="fig" rid="figure6">Figure 6</xref>). Notably, the model maintains stable performance even during the most challenging epidemic period, while achieving tighter error distributions in the nonepidemic period. These results confirm the practical reliability of our integrated model for real-world influenza surveillance applications.</p><fig position="float" id="figure6"><label>Figure 6.</label><caption><p>Convolutional long short-term memory prediction error distribution in 1-week-ahead ILI% predictions using ILI% + Baidu index. Four different periods: all-time, epidemic + nonepidemic, epidemic, and nonepidemic. Each period is represented by a box plot, where the green horizontal line indicates the median of the data, the blue box represents the interquartile range from the first quartile (<bold>Q1</bold>) to the third quartile (<bold>Q3</bold>), and any data points outside the whiskers are marked with circles, indicating potential outliers. ILI%: percentage of influenza-like illness.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v27i1e71786_fig06.png"/></fig></sec><sec id="s3-3-2"><title>Explainability of Model Predictions</title><p>To validate the prediction reliability of the model, SHAP analysis was used to assess feature importance based on ILI% + Baidu index data in epidemic + nonepidemic period. The results demonstrate that both the Baidu index (SHAP value=2.487) and the ILI% (SHAP value=3.172) contribute significantly to the predictive outcomes (<xref ref-type="supplementary-material" rid="app5">Multimedia Appendix 5</xref>). While ILI% exhibits slightly higher importance, the Baidu index provides complementary search behavior data that effectively compensate for the limitations of traditional surveillance indicators, particularly in capturing early warning signals. This finding confirms the value of integrating web-based search data with conventional epidemiological data, offering more comprehensive support for influenza forecasting.</p></sec><sec id="s3-3-3"><title>Hyperparameter Sensitivity Analysis</title><p>This study conducted a hyperparameter sensitivity analysis for 1-week-ahead ILI% predictions using ILI% + Baidu index data in epidemic + nonepidemic period to evaluate 3 key parameters (<xref ref-type="table" rid="table3">Table 3</xref>): the number of attention heads (Num_head) in transformer, the kernel size (Kernel) in convolutional neural networks, and the number of layers (Num_layer) in LSTM. While holding 2 hyperparameters constant, it systematically varied the third hyperparameter and evaluated model performance. This procedure yielded a total of 7 comparative experiments for hyperparameter sensitivity analysis. The experimental results demonstrated that the optimal configuration (Num_head=8, Kernel=9, and Num_layer=2) achieved superior performance across all evaluation metrics. Based on these findings, this study implemented this optimal hyperparameter configuration in the final model to ensure robust predictive performance.</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Hyperparameter sensitivity analysis of convolutional long short-term memory.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom" colspan="3">Hyperparameter</td><td align="left" valign="bottom">MAPE<sup><xref ref-type="table-fn" rid="table3fn4">d</xref></sup> (%)</td><td align="left" valign="bottom">MSE<sup><xref ref-type="table-fn" rid="table3fn5">e</xref></sup></td><td align="left" valign="bottom">MAE<sup><xref ref-type="table-fn" rid="table3fn6">f</xref></sup></td><td align="left" valign="bottom">RMSE<sup><xref ref-type="table-fn" rid="table3fn7">g</xref></sup></td><td align="left" valign="bottom"><italic>R</italic><sup>2</sup></td></tr><tr><td align="left" valign="bottom">Num_head<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup></td><td align="left" valign="bottom">Kernel<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup></td><td align="left" valign="bottom">Num_layer<sup><xref ref-type="table-fn" rid="table3fn3">c</xref></sup></td><td align="left" valign="bottom"/><td align="left" valign="bottom"/><td align="left" valign="bottom"/><td align="left" valign="bottom"/><td align="left" valign="bottom"/></tr></thead><tbody><tr><td align="char" char="." valign="top">4</td><td align="char" char="." valign="top">9</td><td align="char" char="." valign="top">2</td><td align="left" valign="top">11.831</td><td align="left" valign="top">1.518</td><td align="left" valign="top">0.757</td><td align="left" valign="top">1.232</td><td align="left" valign="top">0.826</td></tr><tr><td align="char" char="." valign="top">8</td><td align="char" char="." valign="top">9</td><td align="char" char="." valign="top">2</td><td align="left" valign="top">11.824</td><td align="left" valign="top">1.243</td><td align="left" valign="top">0.723</td><td align="left" valign="top">1.115</td><td align="left" valign="top">0.827</td></tr><tr><td align="char" char="." valign="top">16</td><td align="char" char="." valign="top">9</td><td align="char" char="." valign="top">2</td><td align="left" valign="top">12.554</td><td align="left" valign="top">1.692</td><td align="left" valign="top">0.833</td><td align="left" valign="top">1.301</td><td align="left" valign="top">0.801</td></tr><tr><td align="char" char="." valign="top">8</td><td align="char" char="." valign="top">1</td><td align="char" char="." valign="top">2</td><td align="left" valign="top">14.695</td><td align="left" valign="top">2.408</td><td align="left" valign="top">0.969</td><td align="left" valign="top">1.552</td><td align="left" valign="top">0.781</td></tr><tr><td align="char" char="." valign="top">8</td><td align="char" char="." valign="top">3</td><td align="char" char="." valign="top">2</td><td align="left" valign="top">15.570</td><td align="left" valign="top">2.603</td><td align="left" valign="top">1.103</td><td align="left" valign="top">1.613</td><td align="left" valign="top">0.764</td></tr><tr><td align="char" char="." valign="top">8</td><td align="char" char="." valign="top">9</td><td align="char" char="." valign="top">2</td><td align="left" valign="top">11.824</td><td align="left" valign="top">1.243</td><td align="left" valign="top">0.723</td><td align="left" valign="top">1.115</td><td align="left" valign="top">0.827</td></tr><tr><td align="char" char="." valign="top">8</td><td align="char" char="." valign="top">9</td><td align="char" char="." valign="top">2</td><td align="left" valign="top">11.824</td><td align="left" valign="top">1.243</td><td align="left" valign="top">0.723</td><td align="left" valign="top">1.115</td><td align="left" valign="top">0.827</td></tr><tr><td align="char" char="." valign="top">8</td><td align="char" char="." valign="top">9</td><td align="char" char="." valign="top">3</td><td align="left" valign="top">11.934</td><td align="left" valign="top">1.580</td><td align="left" valign="top">0.769</td><td align="left" valign="top">1.257</td><td align="left" valign="top">0.817</td></tr><tr><td align="char" char="." valign="top">8</td><td align="char" char="." valign="top">9</td><td align="char" char="." valign="top">4</td><td align="left" valign="top">17.100</td><td align="left" valign="top">2.742</td><td align="left" valign="top">1.137</td><td align="left" valign="top">1.656</td><td align="left" valign="top">0.751</td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup> Num_head: the number of attention heads in transformer.</p></fn><fn id="table3fn2"><p><sup>b</sup>Kernel: the kernel size in convolutional neural networks.</p></fn><fn id="table3fn3"><p><sup>c</sup>Num_layer: the number of layers in long short-term memory.</p></fn><fn id="table3fn4"><p><sup>d</sup>MAPE: mean absolute percentage error.</p></fn><fn id="table3fn5"><p><sup>e</sup>MSE: mean square error.</p></fn><fn id="table3fn6"><p><sup>f</sup>MAE: mean absolute error.</p></fn><fn id="table3fn7"><p><sup>g</sup>RMSE: root-mean-square error.</p></fn></table-wrap-foot></table-wrap></sec></sec><sec id="s3-4"><title>Comparisons With Other Methods</title><sec id="s3-4-1"><title>Models&#x2019; Performance for Prediction</title><p>The comparative performance evaluation of CLSTM against traditional LSTM and transformer architectures was conducted for 1-week-ahead ILI% predictions using ILI% + Baidu index data in epidemic + nonepidemic period (<xref ref-type="table" rid="table4">Table 4</xref> and <xref ref-type="fig" rid="figure7">Figure 7</xref>). Quantitative analysis revealed that CLSTM consistently outperformed baseline models across all evaluation metrics, achieving superior performance in prediction accuracy (MSE: 1.243 vs 2.230/2.009; MAE: 0.723 vs 0.654/0.705; and RMSE: 1.115 vs 1.493/1.417), stability (MAPE: 11.824% vs 14.458%/13.561%), and explanatory power (<italic>R</italic>&#x00B2;: 0.827 vs 0.744/0.803). The performance advantage was particularly pronounced during interseasonal transitions between epidemic and nonepidemic periods, demonstrating CLSTM&#x2019;s enhanced capability in modeling complex nonlinear relationships and long-term temporal dependencies inherent in syndromic surveillance data. These results substantiate the effectiveness of our proposed architecture for ILI prediction tasks under real-world surveillance scenarios.</p><table-wrap id="t4" position="float"><label>Table 4.</label><caption><p>Evaluation metrics of 3 model prediction performance<sup><xref ref-type="table-fn" rid="table4fn1">a</xref></sup>.</p></caption><table id="table4" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Model</td><td align="left" valign="bottom">MAPE<sup><xref ref-type="table-fn" rid="table4fn2">b</xref></sup> (%)</td><td align="left" valign="bottom">MSE<sup><xref ref-type="table-fn" rid="table4fn3">c</xref></sup></td><td align="left" valign="bottom">MAE<sup><xref ref-type="table-fn" rid="table4fn4">d</xref></sup></td><td align="left" valign="bottom">RMSE<sup><xref ref-type="table-fn" rid="table4fn5">e</xref></sup></td><td align="left" valign="bottom"><italic>R</italic><sup>2</sup></td></tr></thead><tbody><tr><td align="left" valign="top">LSTM<sup><xref ref-type="table-fn" rid="table4fn6">f</xref></sup></td><td align="left" valign="top">14.458</td><td align="left" valign="top">2.230</td><td align="left" valign="top">0.654</td><td align="left" valign="top">1.493</td><td align="left" valign="top">0.744</td></tr><tr><td align="left" valign="top">Transformer</td><td align="left" valign="top">13.561</td><td align="left" valign="top">2.009</td><td align="left" valign="top">0.705</td><td align="left" valign="top">1.417</td><td align="left" valign="top">0.803</td></tr><tr><td align="left" valign="top">CLSTM<sup><xref ref-type="table-fn" rid="table4fn7">g</xref></sup></td><td align="left" valign="top">11.824</td><td align="left" valign="top">1.243</td><td align="left" valign="top">0.723</td><td align="left" valign="top">1.115</td><td align="left" valign="top">0.827</td></tr></tbody></table><table-wrap-foot><fn id="table4fn1"><p><sup>a</sup>The comparative performance evaluation of convolutional long short-term memory against traditional long short-term memory and transformer architectures was conducted for 1-week-ahead percentage of  influenza-like illness  predictions using the percentage of influenza-like illness  + Baidu index data in epidemic + nonepidemic period.</p></fn><fn id="table4fn2"><p><sup>b</sup>MAPE: mean absolute percentage error.</p></fn><fn id="table4fn3"><p><sup>c</sup>MSE: mean square error.</p></fn><fn id="table4fn4"><p><sup>d</sup>MAE: mean absolute error.</p></fn><fn id="table4fn5"><p><sup>e</sup> RMSE: root-mean-square error.</p></fn><fn id="table4fn6"><p><sup>f</sup>LSTM: long short-term memory.</p></fn><fn id="table4fn7"><p><sup>g</sup>CLSTM: convolutional long short-term memory.</p></fn></table-wrap-foot></table-wrap><fig position="float" id="figure7"><label>Figure 7.</label><caption><p>Comparison of 3 model prediction performance for 1-week-ahead ILI% predictions using ILI% + Baidu index data in epidemic + nonepidemic period. CLSTM: convolutional long short-term memory; ILI%: percentage of influenza-like illness; LSTM: long short-term memory.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v27i1e71786_fig07.png"/></fig></sec><sec id="s3-4-2"><title>Model Computational Efficiency and Complexity Analysis</title><sec id="s3-4-2-1"><title>Model Computational Efficiency</title><p>For model computational efficiency, the study used FLOPs and the number of parameters as evaluation metrics (<xref ref-type="table" rid="table5">Table 5</xref>). FLOPs can be used to measure computational efficiency because it directly reflects the amount of computational resources and processing speed required by the model when performing computational tasks. Similarly, parameters indicate the model&#x2019;s complexity and memory footprint, which are crucial for practical deployment. The results show that while the CLSTM model has a higher FLOPs value (0.40G) than the LSTM (0.08G), it is still lower than the transformer&#x2019;s FLOPs (0.48G). Additionally, the CLSTM model has fewer parameters (2.88M) than the transformer (3.44M) but more than the LSTM (0.47M). This indicates that CLSTM achieves a good balance between computational complexity, memory usage, and performance.</p><table-wrap id="t5" position="float"><label>Table 5.</label><caption><p>Model computational complexity analysis.</p></caption><table id="table5" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Model</td><td align="left" valign="bottom">FLOPs<sup><xref ref-type="table-fn" rid="table5fn1">a</xref></sup> (GB)</td><td align="left" valign="bottom">Parameters (MB)</td><td align="left" valign="bottom">Big-O</td></tr></thead><tbody><tr><td align="left" valign="top">LSTM<sup><xref ref-type="table-fn" rid="table5fn2">b</xref></sup></td><td align="left" valign="top">0.08</td><td align="left" valign="top">0.47</td><td align="left" valign="top">O (T<sup><xref ref-type="table-fn" rid="table5fn3">c</xref></sup>&#x00B7;d&#x00B2;<sup><xref ref-type="table-fn" rid="table5fn4">d</xref></sup>)</td></tr><tr><td align="left" valign="top">Transformer</td><td align="left" valign="top">0.48</td><td align="left" valign="top">3.44</td><td align="left" valign="top">O (N&#x00B7;T&#x00B2;&#x00B7;d)</td></tr><tr><td align="left" valign="top">CLSTM<sup><xref ref-type="table-fn" rid="table5fn5">e</xref></sup></td><td align="left" valign="top">0.40</td><td align="left" valign="top">2.88</td><td align="left" valign="top">O (E<sup><xref ref-type="table-fn" rid="table5fn6">f</xref></sup> &#x00B7;n&#x00B7;m&#x00B7;k&#x00B7;(<italic>f</italic>+h<sup><xref ref-type="table-fn" rid="table5fn7">g</xref></sup>))</td></tr></tbody></table><table-wrap-foot><fn id="table5fn1"><p><sup>a</sup>FLOPs: floating-point operations per second.</p></fn><fn id="table5fn2"><p><sup>b</sup>LSTM: long short-term memory.</p></fn><fn id="table5fn3"><p><sup>c</sup> T: input sequence length.</p></fn><fn id="table5fn4"><p><sup>d</sup>d: input feature dimension.</p></fn><fn id="table5fn5"><p><sup>e</sup>CLSTM: convolutional long short-term memory.</p></fn><fn id="table5fn6"><p><sup>f</sup>E: epoch.</p></fn><fn id="table5fn7"><p><sup>g</sup>h: hidden state dimension.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-4-2-2"><title>Model Computational Complexity Analysis</title><p>The computational complexity analysis reveals the performance differences among LSTM, transformer, and CLSTM (<xref ref-type="table" rid="table5">Table 5</xref>). First, LSTM&#x2019;s O(T&#x00B7;d&#x00B2;) limits its scalability with high-dimensional data; second, transformer&#x2019;s O(N&#x00B7;T&#x00B2;&#x00B7;d) incurs higher computational costs due to the number of attention heads. In contrast, CLSTM&#x2019;s O (E&#x00B7;n&#x00B7;m&#x00B7;k&#x00B7;(<italic>f</italic>+h)), although influenced by multiple factors, can achieve greater efficiency through optimization of batch size and filter dimensions. It can make it more scalable for tasks involving complex features and long sequences. The derivation process for the Big-O complexity estimation is shown in <xref ref-type="supplementary-material" rid="app6">Multimedia Appendix 6</xref>.</p></sec></sec></sec><sec id="s3-5"><title>Comparing Training Stability Across Different Influenza Periods</title><p>To compare the training stability of models across epidemic and nonepidemic periods, this study presents the loss functions of 3 models (CLSTM, transformer, and LSTM) (<xref ref-type="fig" rid="figure8">Figure 8A and B</xref>). Comparative analysis revealed consistent performance rankings: transformer achieved optimal convergence, LSTM exhibited the weakest performance, and CLSTM maintained robust intermediate performance. CLSTM demonstrated remarkable stability despite seasonal variations in data distribution, highlighting superior robustness and cross-distribution adaptability. All-time period convergence analysis (<xref ref-type="supplementary-material" rid="app7">Multimedia Appendix 7</xref>) yielded consistent results with seasonal evaluations.</p><fig position="float" id="figure8"><label>Figure 8.</label><caption><p>Loss functions of 3 models (CLSTM, transformer, and LSTM). (A) Epidemic period. (B) Nonepidemic period. CLSTM: convolutional long short-term memory; LSTM: long short-term memory.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v27i1e71786_fig08.png"/></fig></sec><sec id="s3-6"><title>External Validation</title><p>To further validate the generalizability of the CLSTM model, the study conducted additional experiments using ILI% from Tianjin and corresponding Baidu index data. The model demonstrated robust performance for 1-week-ahead ILI% predictions using ILI% + Baidu index data in epidemic + nonepidemic period (<xref ref-type="table" rid="table6">Table 6</xref>), achieving an <italic>R</italic>&#x00B2; of 0.755 &#x003E;0.7, MAPE of 17.832% &#x003C;20%, and low error metrics (RMSE=1.716, MSE=2.943, and MAE=1.216). These results indicate the model&#x2019;s strong predictive capability on external datasets. Comparative analysis revealed the CLSTM model&#x2019;s superior performance over LSTM and transformer. It confirmed the model&#x2019;s enhanced ability to capture spatiotemporal patterns in ILI transmission.</p><table-wrap id="t6" position="float"><label>Table 6.</label><caption><p>Evaluation metrics of 3 model prediction performance in external validation<sup><xref ref-type="table-fn" rid="table6fn1">a</xref></sup>.</p></caption><table id="table6" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Model</td><td align="left" valign="bottom">MAPE<sup><xref ref-type="table-fn" rid="table6fn2">b</xref></sup> (%)</td><td align="left" valign="bottom">MSE<sup><xref ref-type="table-fn" rid="table6fn3">c</xref></sup></td><td align="left" valign="bottom">MAE<sup><xref ref-type="table-fn" rid="table6fn4">d</xref></sup></td><td align="left" valign="bottom">RMSE<sup><xref ref-type="table-fn" rid="table6fn5">e</xref></sup></td><td align="left" valign="bottom"><italic>R</italic><sup>2</sup></td></tr></thead><tbody><tr><td align="left" valign="top">LSTM<sup><xref ref-type="table-fn" rid="table6fn6">f</xref></sup></td><td align="left" valign="top">26.458</td><td align="left" valign="top">4.065</td><td align="left" valign="top">2.988</td><td align="left" valign="top">2.016</td><td align="left" valign="top">0.700</td></tr><tr><td align="left" valign="top">Transformer</td><td align="left" valign="top">21.887</td><td align="left" valign="top">3.111</td><td align="left" valign="top">2.001</td><td align="left" valign="top">1.764</td><td align="left" valign="top">0.743</td></tr><tr><td align="left" valign="top">CLSTM<sup><xref ref-type="table-fn" rid="table6fn7">g</xref></sup></td><td align="left" valign="top">17.832</td><td align="left" valign="top">2.943</td><td align="left" valign="top">1.216</td><td align="left" valign="top">1.716</td><td align="left" valign="top">0.755</td></tr></tbody></table><table-wrap-foot><fn id="table6fn1"><p><sup>a</sup>The comparative performance evaluation of convolutional long short-term memory against traditional long short-term memory and transformer architectures was conducted for 1-week-ahead percentage of influenza-like illness  predictions using the percentage of influenza-like illness  + Baidu index data in epidemic + nonepidemic period.</p></fn><fn id="table6fn2"><p><sup>b</sup>MAPE: mean absolute percentage error.</p></fn><fn id="table6fn3"><p><sup>c</sup>MSE: mean square error.</p></fn><fn id="table6fn4"><p><sup>d</sup>MAE: mean absolute error.</p></fn><fn id="table6fn5"><p><sup>e</sup>RMSE: root-mean-square error.</p></fn><fn id="table6fn6"><p><sup>f</sup>LSTM: long short-term memory.</p></fn><fn id="table6fn7"><p><sup>g</sup>CLSTM: convolutional long short-term memory.</p></fn></table-wrap-foot></table-wrap></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>Although current models of transmission epidemiology largely rely on surveillance data and mathematical models, there have been many studies exploring the potential of alternative data sources and machine learning techniques. This study integrates Baidu index data with traditional surveillance data to propose a deep learning framework that uses multifeatured time series for different influenza epidemic states. By considering the impacts of both epidemic and nonepidemic seasons, the framework enhances the accuracy of influenza predictions. Analysis revealed that the weekly search volumes for 4 types of Baidu search terms related to influenza&#x2014;essential facts, symptoms, treatment, and prevention&#x2014;were strongly correlated with ILI%. By distinguishing between epidemic and nonepidemic seasons, this study found that these search terms had different focuses during each period. Based on these findings, we developed a CLSTM deep learning framework using multifeatured time series from multiple data sources. The study was conducted over 4 research periods: all time periods, the combined epidemic and nonepidemic periods, the epidemic period, and the nonepidemic period. The framework can predict influenza trends up to 2 weeks in advance. This research investigates the application of combining public opinion data with traditional surveillance systems to predict influenza epidemics. It provides a valuable reference not only for northern China but also for advancements in modern surveillance methods.</p><p>Dividing the study period into epidemic and nonepidemic seasons can more accurately capture the seasonal characteristics of the public&#x2019;s search behavior for influenza information (Baidu index). The ILI% was used to predict trends in influenza virus incidence [<xref ref-type="bibr" rid="ref32">32</xref>]. An increase in the ILI% usually signals the peak of an influenza pandemic, and health care providers and public health departments can take timely action based on the change in the ILI% to intensify their influenza prevention and treatment efforts. Nevertheless, influenza risks vary during different seasons. Therefore, dividing the study period into epidemic and nonepidemic seasons better captures seasonal variations in public concern and search behavior, which are crucial for predicting influenza trends. During the influenza epidemic season, members of the public, with heightened crisis awareness and perceived increased risk of contracting influenza, proactively obtain relevant information for self-assessment and prevention. Specifically, they pay attention to the symptoms of influenza for self-diagnosis, learn about transmission routes to prevent infection, and seek preventive measures to protect themselves. These behaviors led to a significant increase in Baidu search terms related to influenza essential facts and prevention, which in turn led to an increase in the Baidu index. In addition, extensive media coverage of influenza cases and outbreak developments also increased public attention. Public health departments usually promote preventive measures such as vaccination and hand hygiene during the epidemic season, which further directs the public to search for related information. In contrast, during the nonepidemic season, the public is relatively less aware of the crisis and less worried about the risk of contracting influenza. In this case, they mainly focus on information related to influenza treatment. Therefore, Baidu search terms focus more on recognizing influenza symptoms, choosing treatments, and effective medications. Media reports and other health information received relatively less attention, while public interest in vaccination and preventive measures declined. Overall, public attention during the nonepidemic season shifted more toward the influenza treatment.</p><p>The inclusion of Baidu index is effective for ILI% prediction. Using separate Baidu search terms for epidemic and nonepidemic seasons will improve prediction performance. The search engine data, as a leading signal of influenza trends, can sense the spreading trend of influenza earlier than the ILI% [<xref ref-type="bibr" rid="ref27">27</xref>]. Baidu index is a globally applicable big data tool, widely used in Baidu-dominated regions (eg, parts of Asia and South America). By the second quarter of 2025, Baidu will have a wide range of active users globally. Baidu operates similarly to Google Trends and other international search indices, making the model adaptable to local platforms (eg, Naver in Korea) without algorithmic modifications. Currently, Baidu index has been used in deep learning&#x2013;based prediction of influenza on several occasions [<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref34">34</xref>]. Search terms filtered from Baidu index are often divided into 4 categories [<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref35">35</xref>]: basic understanding of influenza, symptoms, treatment and medicine, and prevention. It is generally consistent with this study&#x2019;s categorization of influenza-related terms.</p><p>At the same time, it is necessary to study influenza prediction using deep learning algorithms. Yang et al [<xref ref-type="bibr" rid="ref34">34</xref>] used data from northern and southern China and integrated a model based on gated recurrent units and multiple attention mechanisms to achieve approximately 2 weeks&#x2019; prediction, with an <italic>R</italic>&#x00B2; value exceeding 0.77. Jung et al [<xref ref-type="bibr" rid="ref36">36</xref>] used a self-attention mechanism-based deep learning model to predict influenza trends, demonstrating significant effectiveness. Additionally, studies [<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref33">33</xref>] combined ILI case, virological surveillance, climate, demographic, and search engine data. They applied LSTM models to predict ILI%, achieving <italic>R</italic>&#x00B2; values from 0.67 to 0.9. Athanasiou et al [<xref ref-type="bibr" rid="ref35">35</xref>] used weekly ILI monitoring data and multisource data, including Twitter and weather conditions, to predict ILI% in Greece with an LSTM model. In this study, using only Baidu index and traditional monitoring data, the CLSTM framework predicted ILI% in 1-2 weeks. The framework&#x2019;s <italic>R</italic><sup>2</sup> value exceeded 0.82, outperforming most studies using multisource data. Comparative analysis demonstrates that CLSTM achieves better performance to classical machine learning models in terms of computational efficiency, complexity, extrapolation capability, and stability.</p><p>It was found that the current papers rarely achieve more than 3 weeks of accurate prediction, which is deemed ineffective [<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref35">35</xref>]. The Baidu index reflects public search behavior for influenza-related information. It typically increases 1-2 weeks before an outbreak and weakens afterward, reducing predictive effectiveness. Traditional ILI% surveillance data are more reliable for longer-term predictions and provide comprehensive information.</p><p>Most influenza prediction studies do not divide epidemic and nonepidemic seasons. This study found that using specific Baidu search terms for each period significantly improves prediction performance and reliability during single epidemic or nonepidemic seasons. This approach allows the framework to capture season-specific patterns more accurately, providing reliable and detailed prediction results.</p></sec><sec id="s4-2"><title>Limitations and Future Works</title><p>However, this study had a few limitations. First, this study did not separately consider the effect of the COVID-19 pandemic on ILI% but allowed the framework to learn from existing trends. Second, computational challenges (eg, real-time latency) must be addressed through optimization and cloud solutions.</p><p>To enhance robustness, future work should explore the following: first, hybrid artificial intelligence strategies (eg, reinforcement learning) for dynamic parameter tuning; second, multisource data integration (social media, electronic health records, and climate variables) to improve sensitivity and reduce confounders; and third, federated learning for privacy-preserving cross-region collaboration, despite computational inequities.</p></sec><sec id="s4-3"><title>Conclusions</title><p>In summary, this study demonstrates significant potential for influenza prediction by integrating Baidu index with traditional surveillance data and specific keywords (for both epidemic and nonepidemic seasons). The CLSTM framework performed exceptionally well, effectively improving prediction accuracy through the use of seasonal Baidu search terms, thereby offering a novel perspective for public health early warning systems. Although Baidu&#x2019;s search engine is widely used internationally, its data are subject to demographic, geographical, and media-driven biases, necessitating population-weighting adjustments and integration with traditional surveillance data to mitigate prediction distortions. Future efforts will focus on further optimizing the model to achieve more timely and accurate predictions: on one hand, leveraging transfer learning to extend this framework to other disease predictions, and on the other hand, using multiobjective optimization to balance accuracy and interpretability. It will ultimately enhance public health response capabilities.</p></sec></sec></body><back><notes><sec><title>Data Availability</title><p>The data presented in this study are available from the corresponding author on reasonable request.</p></sec></notes><fn-group><fn fn-type="con"><p>JL and XY contributed to conceptualization, data curation, formal analysis, investigation, writing&#x2014;original draft, and writing&#x2014;review and editing. XC, YZ, and GL assisted with writing&#x2014;review and editing. LL, YL, and XD handled formal analysis. ZM, ZL, JY, and XS contributed to data curation and formal analysis. CC contributed to conceptualization, supervision, and writing&#x2014;review and editing.</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">CLSTM</term><def><p>convolutional long short-term memory</p></def></def-item><def-item><term id="abb2">FLOP</term><def><p>floating-point operation per second</p></def></def-item><def-item><term id="abb3">ILI</term><def><p>influenza-like illness</p></def></def-item><def-item><term id="abb4">ILI%</term><def><p>percentage of influenza-like illness</p></def></def-item><def-item><term id="abb5">LSTM</term><def><p>long short-term memory</p></def></def-item><def-item><term id="abb6">MAE</term><def><p>mean absolute error</p></def></def-item><def-item><term id="abb7">MAPE</term><def><p>mean absolute percentage error</p></def></def-item><def-item><term id="abb8">MSE</term><def><p>mean square error</p></def></def-item><def-item><term id="abb9">NIDRIS</term><def><p>National Notifiable Infectious Disease Reporting System</p></def></def-item><def-item><term id="abb10">RMSE</term><def><p>root-mean-square error</p></def></def-item><def-item><term id="abb11">SHAP</term><def><p>Shapley Additive Explanations</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Iuliano</surname><given-names>AD</given-names> </name><name name-style="western"><surname>Roguski</surname><given-names>KM</given-names> </name><name name-style="western"><surname>Chang</surname><given-names>HH</given-names> </name><etal/></person-group><article-title>Estimates of global seasonal influenza-associated respiratory mortality: a modelling study</article-title><source>Lancet</source><year>2018</year><month>03</month><day>31</day><volume>391</volume><issue>10127</issue><fpage>1285</fpage><lpage>1300</lpage><pub-id pub-id-type="doi">10.1016/S0140-6736(17)33293-2</pub-id><pub-id pub-id-type="medline">29248255</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Krammer</surname><given-names>F</given-names> </name><name name-style="western"><surname>Smith</surname><given-names>GJD</given-names> </name><name name-style="western"><surname>Fouchier</surname><given-names>RAM</given-names> </name><etal/></person-group><article-title>Influenza</article-title><source>Nat Rev Dis Primers</source><year>2018</year><month>06</month><day>28</day><volume>4</volume><issue>1</issue><fpage>3</fpage><pub-id pub-id-type="doi">10.1038/s41572-018-0002-y</pub-id><pub-id pub-id-type="medline">29955068</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Caceres</surname><given-names>CJ</given-names> </name><name name-style="western"><surname>Seibert</surname><given-names>B</given-names> </name><name name-style="western"><surname>Cargnin Faccin</surname><given-names>F</given-names> </name><name name-style="western"><surname>Cardenas-Garcia</surname><given-names>S</given-names> </name><name name-style="western"><surname>Rajao</surname><given-names>DS</given-names> </name><name name-style="western"><surname>Perez</surname><given-names>DR</given-names> </name></person-group><article-title>Influenza antivirals and animal models</article-title><source>FEBS Open Bio</source><year>2022</year><month>06</month><volume>12</volume><issue>6</issue><fpage>1142</fpage><lpage>1165</lpage><pub-id pub-id-type="doi">10.1002/2211-5463.13416</pub-id><pub-id pub-id-type="medline">35451200</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Li</surname><given-names>L</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>P</given-names> </name><etal/></person-group><article-title>Influenza-associated excess respiratory mortality in China, 2010-15: a population-based study</article-title><source>Lancet Public Health</source><year>2019</year><month>09</month><volume>4</volume><issue>9</issue><fpage>e473</fpage><lpage>e481</lpage><pub-id pub-id-type="doi">10.1016/S2468-2667(19)30163-X</pub-id><pub-id pub-id-type="medline">31493844</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="web"><article-title>Influenza weekly report [Web page in Chinese]</article-title><source>Chinese Center for Disease Control and Prevention</source><year>2025</year><month>01</month><day>16</day><access-date>2025-07-18</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://ivdc.chinacdc.cn/cnic/zyzx/lgzb/202501/t20250116_303896.htm">https://ivdc.chinacdc.cn/cnic/zyzx/lgzb/202501/t20250116_303896.htm</ext-link></comment></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="web"><article-title>Influenza (seasonal)</article-title><source>World Health Organization</source><year>2025</year><month>02</month><day>28</day><access-date>2025-07-17</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.who.int/news-room/fact-sheets/detail/influenza-(seasonal)">https://www.who.int/news-room/fact-sheets/detail/influenza-(seasonal)</ext-link></comment></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pearce</surname><given-names>N</given-names> </name><name name-style="western"><surname>Vandenbroucke</surname><given-names>JP</given-names> </name><name name-style="western"><surname>VanderWeele</surname><given-names>TJ</given-names> </name><name name-style="western"><surname>Greenland</surname><given-names>S</given-names> </name></person-group><article-title>Accurate statistics on COVID-19 are essential for policy guidance and decisions</article-title><source>Am J Public Health</source><year>2020</year><month>07</month><volume>110</volume><issue>7</issue><fpage>949</fpage><lpage>951</lpage><pub-id pub-id-type="doi">10.2105/AJPH.2020.305708</pub-id><pub-id pub-id-type="medline">32324422</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Santillana</surname><given-names>M</given-names> </name><name name-style="western"><surname>Nguyen</surname><given-names>AT</given-names> </name><name name-style="western"><surname>Louie</surname><given-names>T</given-names> </name><etal/></person-group><article-title>Cloud-based electronic health records for real-time, region-specific influenza surveillance</article-title><source>Sci Rep</source><year>2016</year><month>05</month><day>11</day><volume>6</volume><issue>1</issue><fpage>25732</fpage><pub-id pub-id-type="doi">10.1038/srep25732</pub-id><pub-id pub-id-type="medline">27165494</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ginsberg</surname><given-names>J</given-names> </name><name name-style="western"><surname>Mohebbi</surname><given-names>MH</given-names> </name><name name-style="western"><surname>Patel</surname><given-names>RS</given-names> </name><name name-style="western"><surname>Brammer</surname><given-names>L</given-names> </name><name name-style="western"><surname>Smolinski</surname><given-names>MS</given-names> </name><name name-style="western"><surname>Brilliant</surname><given-names>L</given-names> </name></person-group><article-title>Detecting influenza epidemics using search engine query data</article-title><source>Nature New Biol</source><year>2009</year><month>02</month><volume>457</volume><issue>7232</issue><fpage>1012</fpage><lpage>1014</lpage><pub-id pub-id-type="doi">10.1038/nature07634</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yang</surname><given-names>S</given-names> </name><name name-style="western"><surname>Santillana</surname><given-names>M</given-names> </name><name name-style="western"><surname>Kou</surname><given-names>SC</given-names> </name></person-group><article-title>Accurate estimation of influenza epidemics using Google search data via ARGO</article-title><source>Proc Natl Acad Sci U S A</source><year>2015</year><month>11</month><day>24</day><volume>112</volume><issue>47</issue><fpage>14473</fpage><lpage>14478</lpage><pub-id pub-id-type="doi">10.1073/pnas.1515373112</pub-id><pub-id pub-id-type="medline">26553980</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yuan</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Nsoesie</surname><given-names>EO</given-names> </name><name name-style="western"><surname>Lv</surname><given-names>B</given-names> </name><name name-style="western"><surname>Peng</surname><given-names>G</given-names> </name><name name-style="western"><surname>Chunara</surname><given-names>R</given-names> </name><name name-style="western"><surname>Brownstein</surname><given-names>JS</given-names> </name></person-group><person-group person-group-type="editor"><name name-style="western"><surname>Cowling</surname><given-names>BJ</given-names> </name></person-group><article-title>Monitoring influenza epidemics in China with search query from Baidu</article-title><source>PLoS One</source><year>2013</year><volume>8</volume><issue>5</issue><fpage>e64323</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0064323</pub-id><pub-id pub-id-type="medline">23750192</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Santillana</surname><given-names>M</given-names> </name><name name-style="western"><surname>Nguyen</surname><given-names>AT</given-names> </name><name name-style="western"><surname>Dredze</surname><given-names>M</given-names> </name><name name-style="western"><surname>Paul</surname><given-names>MJ</given-names> </name><name name-style="western"><surname>Nsoesie</surname><given-names>EO</given-names> </name><name name-style="western"><surname>Brownstein</surname><given-names>JS</given-names> </name></person-group><person-group person-group-type="editor"><name name-style="western"><surname>Salath&#x00E9;</surname><given-names>M</given-names> </name></person-group><article-title>Combining search, social media, and traditional data sources to improve influenza surveillance</article-title><source>PLoS Comput Biol</source><year>2015</year><month>10</month><volume>11</volume><issue>10</issue><fpage>e1004513</fpage><pub-id pub-id-type="doi">10.1371/journal.pcbi.1004513</pub-id><pub-id pub-id-type="medline">26513245</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zimmer</surname><given-names>C</given-names> </name><name name-style="western"><surname>Leuba</surname><given-names>SI</given-names> </name><name name-style="western"><surname>Yaesoubi</surname><given-names>R</given-names> </name><name name-style="western"><surname>Cohen</surname><given-names>T</given-names> </name></person-group><article-title>Use of daily Internet search query data improves real-time projections of influenza epidemics</article-title><source>J R Soc Interface</source><year>2018</year><month>10</month><day>10</day><volume>15</volume><issue>147</issue><fpage>20180220</fpage><pub-id pub-id-type="doi">10.1098/rsif.2018.0220</pub-id><pub-id pub-id-type="medline">30305417</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Alessa</surname><given-names>A</given-names> </name><name name-style="western"><surname>Faezipour</surname><given-names>M</given-names> </name></person-group><article-title>A review of influenza detection and prediction through social networking sites</article-title><source>Theor Biol Med Model</source><year>2018</year><month>02</month><day>1</day><volume>15</volume><issue>1</issue><fpage>2</fpage><pub-id pub-id-type="doi">10.1186/s12976-017-0074-5</pub-id><pub-id pub-id-type="medline">29386017</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hu</surname><given-names>H</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>H</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>F</given-names> </name><name name-style="western"><surname>Langley</surname><given-names>D</given-names> </name><name name-style="western"><surname>Avram</surname><given-names>A</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>M</given-names> </name></person-group><article-title>Prediction of influenza-like illness based on the improved artificial tree algorithm and artificial neural network</article-title><source>Sci Rep</source><year>2018</year><month>03</month><day>20</day><volume>8</volume><issue>1</issue><fpage>4895</fpage><pub-id pub-id-type="doi">10.1038/s41598-018-23075-1</pub-id><pub-id pub-id-type="medline">29559649</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hickmann</surname><given-names>KS</given-names> </name><name name-style="western"><surname>Fairchild</surname><given-names>G</given-names> </name><name name-style="western"><surname>Priedhorsky</surname><given-names>R</given-names> </name><etal/></person-group><article-title>Forecasting the 2013-2014 influenza season using Wikipedia</article-title><source>PLoS Comput Biol</source><year>2015</year><month>05</month><volume>11</volume><issue>5</issue><fpage>e1004239</fpage><pub-id pub-id-type="doi">10.1371/journal.pcbi.1004239</pub-id><pub-id pub-id-type="medline">25974758</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yang</surname><given-names>S</given-names> </name><name name-style="western"><surname>Santillana</surname><given-names>M</given-names> </name><name name-style="western"><surname>Brownstein</surname><given-names>JS</given-names> </name><name name-style="western"><surname>Gray</surname><given-names>J</given-names> </name><name name-style="western"><surname>Richardson</surname><given-names>S</given-names> </name><name name-style="western"><surname>Kou</surname><given-names>SC</given-names> </name></person-group><article-title>Using electronic health records and Internet search information for accurate influenza forecasting</article-title><source>BMC Infect Dis</source><year>2017</year><month>05</month><day>8</day><volume>17</volume><issue>1</issue><fpage>332</fpage><pub-id pub-id-type="doi">10.1186/s12879-017-2424-7</pub-id><pub-id pub-id-type="medline">28482810</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lazer</surname><given-names>D</given-names> </name><name name-style="western"><surname>Kennedy</surname><given-names>R</given-names> </name><name name-style="western"><surname>King</surname><given-names>G</given-names> </name><name name-style="western"><surname>Vespignani</surname><given-names>A</given-names> </name></person-group><article-title>The parable of Google Flu: traps in big data analysis</article-title><source>Science</source><year>2014</year><month>03</month><day>14</day><volume>343</volume><issue>6176</issue><fpage>1203</fpage><lpage>1205</lpage><pub-id pub-id-type="doi">10.1126/science.1248506</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Viboud</surname><given-names>C</given-names> </name><name name-style="western"><surname>Charu</surname><given-names>V</given-names> </name><name name-style="western"><surname>Olson</surname><given-names>D</given-names> </name><etal/></person-group><person-group person-group-type="editor"><name name-style="western"><surname>Goldstein</surname><given-names>E</given-names> </name></person-group><article-title>Demonstrating the use of high-volume electronic medical claims data to monitor local and regional influenza activity in the US</article-title><source>PLoS One</source><year>2014</year><volume>9</volume><issue>7</issue><fpage>e102429</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0102429</pub-id><pub-id pub-id-type="medline">25072598</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Moss</surname><given-names>R</given-names> </name><name name-style="western"><surname>Zarebski</surname><given-names>A</given-names> </name><name name-style="western"><surname>Dawson</surname><given-names>P</given-names> </name><name name-style="western"><surname>McCaw</surname><given-names>JM</given-names> </name></person-group><article-title>Forecasting influenza outbreak dynamics in Melbourne from internet search query surveillance data</article-title><source>Influenza Other Respir Viruses</source><year>2016</year><month>07</month><volume>10</volume><issue>4</issue><fpage>314</fpage><lpage>323</lpage><pub-id pub-id-type="doi">10.1111/irv.12376</pub-id><pub-id pub-id-type="medline">26859411</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Xu</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Gel</surname><given-names>YR</given-names> </name><name name-style="western"><surname>Ramirez Ramirez</surname><given-names>LL</given-names> </name><name name-style="western"><surname>Nezafati</surname><given-names>K</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Tsui</surname><given-names>KL</given-names> </name></person-group><article-title>Forecasting influenza in Hong Kong with Google search queries and statistical model fusion</article-title><source>PLoS One</source><year>2017</year><volume>12</volume><issue>5</issue><fpage>e0176690</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0176690</pub-id><pub-id pub-id-type="medline">28464015</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Adamidi</surname><given-names>ES</given-names> </name><name name-style="western"><surname>Mitsis</surname><given-names>K</given-names> </name><name name-style="western"><surname>Nikita</surname><given-names>KS</given-names> </name></person-group><article-title>Artificial intelligence in clinical care amidst COVID-19 pandemic: a systematic review</article-title><source>Comput Struct Biotechnol J</source><year>2021</year><volume>19</volume><fpage>2833</fpage><lpage>2850</lpage><pub-id pub-id-type="doi">10.1016/j.csbj.2021.05.010</pub-id><pub-id pub-id-type="medline">34025952</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="web"><source>Baidu index [Website in Chinese]</source><year>2024</year><month>03</month><day>31</day><access-date>2025-07-18</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://index.baidu.com/v2/index.html">https://index.baidu.com/v2/index.html</ext-link></comment></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="web"><article-title>Influenza diagnosis and treatment programme (2020 version) [Web page in Chinese]</article-title><source>The State Council of the People's Republic of China</source><year>2020</year><month>10</month><day>27</day><access-date>2025-07-17</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.gov.cn/zhengce/zhengceku/2020-11/05/content_5557639.htm">https://www.gov.cn/zhengce/zhengceku/2020-11/05/content_5557639.htm</ext-link></comment></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="web"><article-title>Influenza weekly report [Web page in Chinese]</article-title><source>Chinese Center for Disease Control and Prevention</source><year>2024</year><month>01</month><day>4</day><access-date>2025-07-18</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://ivdc.chinacdc.cn/cnic/zyzx/lgzb/202401/t20240104_271820.htm">https://ivdc.chinacdc.cn/cnic/zyzx/lgzb/202401/t20240104_271820.htm</ext-link></comment></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="web"><article-title>Technical guidelines for influenza vaccination in China [Web page in Chinese]</article-title><source>Chinese Center for Disease Control and Prevention</source><year>2023</year><month>09</month><day>5</day><access-date>2025-07-17</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://ivdc.chinacdc.cn/cnic/zyzx/jcfa/202405/t20240522_278672.htm">https://ivdc.chinacdc.cn/cnic/zyzx/jcfa/202405/t20240522_278672.htm</ext-link></comment></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="web"><article-title>Technical guidelines for national influenza surveillance [Web page in Chinese]</article-title><source>Chinese Center for Disease Control and Prevention</source><year>2017</year><month>09</month><day>30</day><access-date>2025-07-17</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://ivdc.chinacdc.cn/cnic/zyzx/jcfa/201709/t20170930_153976.htm">https://ivdc.chinacdc.cn/cnic/zyzx/jcfa/201709/t20170930_153976.htm</ext-link></comment></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liang</surname><given-names>F</given-names> </name><name name-style="western"><surname>Guan</surname><given-names>P</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>W</given-names> </name><name name-style="western"><surname>Huang</surname><given-names>D</given-names> </name></person-group><article-title>Forecasting influenza epidemics by integrating internet search queries and traditional surveillance data with the support vector machine regression model in Liaoning, from 2011 to 2015</article-title><source>PeerJ</source><year>2018</year><volume>6</volume><fpage>e5134</fpage><pub-id pub-id-type="doi">10.7717/peerj.5134</pub-id><pub-id pub-id-type="medline">29967755</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>J</given-names> </name><name name-style="western"><surname>Huang</surname><given-names>X</given-names> </name><name name-style="western"><surname>Li</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>G</given-names> </name><name name-style="western"><surname>Tai</surname><given-names>Y</given-names> </name></person-group><article-title>Hourly stepwise forecasting for solar irradiance using integrated hybrid models CNN-LSTM-MLP combined with error correction and VMD</article-title><source>Energy Convers Manag</source><year>2023</year><month>03</month><volume>280</volume><fpage>116804</fpage><pub-id pub-id-type="doi">10.1016/j.enconman.2023.116804</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dou</surname><given-names>W</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>K</given-names> </name><name name-style="western"><surname>Shan</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Day-ahead Numerical Weather Prediction solar irradiance correction using a clustering method based on weather conditions</article-title><source>Appl Energy</source><year>2024</year><month>07</month><volume>365</volume><fpage>123239</fpage><pub-id pub-id-type="doi">10.1016/j.apenergy.2024.123239</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wei</surname><given-names>S</given-names> </name><name name-style="western"><surname>Lin</surname><given-names>S</given-names> </name><name name-style="western"><surname>Wenjing</surname><given-names>Z</given-names> </name><etal/></person-group><article-title>The prediction of influenza-like illness using national influenza surveillance data and Baidu query data</article-title><source>BMC Public Health</source><year>2024</year><month>02</month><day>19</day><volume>24</volume><issue>1</issue><fpage>513</fpage><pub-id pub-id-type="doi">10.1186/s12889-024-17978-0</pub-id><pub-id pub-id-type="medline">38369456</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Su</surname><given-names>K</given-names> </name><name name-style="western"><surname>Xu</surname><given-names>L</given-names> </name><name name-style="western"><surname>Li</surname><given-names>G</given-names> </name><etal/></person-group><article-title>Forecasting influenza activity using self-adaptive AI model and multi-source data in Chongqing, China</article-title><source>EBioMedicine</source><year>2019</year><month>09</month><volume>47</volume><fpage>284</fpage><lpage>292</lpage><pub-id pub-id-type="doi">10.1016/j.ebiom.2019.08.024</pub-id><pub-id pub-id-type="medline">31477561</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yang</surname><given-names>L</given-names> </name><name name-style="western"><surname>Li</surname><given-names>G</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Deep-learning model for influenza prediction from multisource heterogeneous data in a megacity: model development and evaluation</article-title><source>J Med Internet Res</source><year>2023</year><month>02</month><day>13</day><volume>25</volume><fpage>e44238</fpage><pub-id pub-id-type="doi">10.2196/44238</pub-id><pub-id pub-id-type="medline">36780207</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yang</surname><given-names>L</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>T</given-names> </name><name name-style="western"><surname>Han</surname><given-names>X</given-names> </name><etal/></person-group><article-title>Influenza epidemic trend surveillance and prediction based on search engine data: deep learning model study</article-title><source>J Med Internet Res</source><year>2023</year><month>10</month><day>17</day><volume>25</volume><fpage>e45085</fpage><pub-id pub-id-type="doi">10.2196/45085</pub-id><pub-id pub-id-type="medline">37847532</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Athanasiou</surname><given-names>M</given-names> </name><name name-style="western"><surname>Fragkozidis</surname><given-names>G</given-names> </name><name name-style="western"><surname>Zarkogianni</surname><given-names>K</given-names> </name><name name-style="western"><surname>Nikita</surname><given-names>KS</given-names> </name></person-group><article-title>Long short-term memory-based prediction of the spread of influenza-like illness leveraging surveillance, weather, and Twitter data: model development and validation</article-title><source>J Med Internet Res</source><year>2023</year><month>02</month><day>6</day><volume>25</volume><fpage>e42519</fpage><pub-id pub-id-type="doi">10.2196/42519</pub-id><pub-id pub-id-type="medline">36745490</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jung</surname><given-names>S</given-names> </name><name name-style="western"><surname>Moon</surname><given-names>J</given-names> </name><name name-style="western"><surname>Park</surname><given-names>S</given-names> </name><name name-style="western"><surname>Hwang</surname><given-names>E</given-names> </name></person-group><article-title>Self-attention-based deep learning network for regional influenza forecasting</article-title><source>IEEE J Biomed Health Inform</source><year>2022</year><month>02</month><volume>26</volume><issue>2</issue><fpage>922</fpage><lpage>933</lpage><pub-id pub-id-type="doi">10.1109/JBHI.2021.3093897</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Mathematical formulation of the convolutional long short-term memory framework.</p><media xlink:href="jmir_v27i1e71786_app1.docx" xlink:title="DOCX File, 42 KB"/></supplementary-material><supplementary-material id="app2"><label>Multimedia Appendix 2</label><p>Model evaluation.</p><media xlink:href="jmir_v27i1e71786_app2.docx" xlink:title="DOCX File, 22 KB"/></supplementary-material><supplementary-material id="app3"><label>Multimedia Appendix 3</label><p>Correlations between Baidu index and percentage of influenza-like illness in all-time period at different lags.</p><media xlink:href="jmir_v27i1e71786_app3.docx" xlink:title="DOCX File, 36 KB"/></supplementary-material><supplementary-material id="app4"><label>Multimedia Appendix 4</label><p>Implementation details of the convolutional long short-term memory framework for the percentage of influenza-like illness.</p><media xlink:href="jmir_v27i1e71786_app4.docx" xlink:title="DOCX File, 20 KB"/></supplementary-material><supplementary-material id="app5"><label>Multimedia Appendix 5</label><p>Shapley Additive Explanations analysis.</p><media xlink:href="jmir_v27i1e71786_app5.docx" xlink:title="DOCX File, 55 KB"/></supplementary-material><supplementary-material id="app6"><label>Multimedia Appendix 6</label><p>Derivation process and results of Big-O complexity estimation.</p><media xlink:href="jmir_v27i1e71786_app6.docx" xlink:title="DOCX File, 21 KB"/></supplementary-material><supplementary-material id="app7"><label>Multimedia Appendix 7</label><p>Convergence analysis for all-time period.</p><media xlink:href="jmir_v27i1e71786_app7.docx" xlink:title="DOCX File, 3327 KB"/></supplementary-material></app-group></back></article>