<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v26i1e48324</article-id>
      <article-id pub-id-type="pmid">38386404</article-id>
      <article-id pub-id-type="doi">10.2196/48324</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Identifying the Risk Factors of Allergic Rhinitis Based on Zhihu Comment Data Using a Topic-Enhanced Word-Embedding Model: Mixed Method Study and Cluster Analysis</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Mavragani</surname>
            <given-names>Amaryllis</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Liu</surname>
            <given-names>Xuan</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Cao</surname>
            <given-names>Yuanyuan</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Gu</surname>
            <given-names>Dongxiao</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>School of Management, Hefei University of Technology</institution>
            <addr-line>193 Tunxi Road</addr-line>
            <addr-line>Hefei, 230009</addr-line>
            <country>China</country>
            <phone>86 13866167367</phone>
            <email>gudongxiao@hfut.edu.cn</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-3557-009X</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>Qin</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0008-1154-8596</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Chai</surname>
            <given-names>Yidong</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0260-7589</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>Xuejie</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-8258-7030</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Zhao</surname>
            <given-names>Wang</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7453-9226</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Li</surname>
            <given-names>Min</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0001-4724-1763</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Zolotarev</surname>
            <given-names>Oleg</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6917-9668</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Xu</surname>
            <given-names>Zhengfei</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0009-4309-8371</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author">
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>Gongrang</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0000-5494-366X</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>School of Management, Hefei University of Technology</institution>
        <addr-line>Hefei</addr-line>
        <country>China</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Russian New University</institution>
        <addr-line>Moscow</addr-line>
        <country>Russian Federation</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Dongxiao Gu <email>gudongxiao@hfut.edu.cn</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2024</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>22</day>
        <month>2</month>
        <year>2024</year>
      </pub-date>
      <volume>26</volume>
      <elocation-id>e48324</elocation-id>
      <history>
        <date date-type="received">
          <day>19</day>
          <month>4</month>
          <year>2023</year>
        </date>
        <date date-type="rev-request">
          <day>12</day>
          <month>10</month>
          <year>2023</year>
        </date>
        <date date-type="rev-recd">
          <day>30</day>
          <month>10</month>
          <year>2023</year>
        </date>
        <date date-type="accepted">
          <day>3</day>
          <month>1</month>
          <year>2024</year>
        </date>
      </history>
      <copyright-statement>©Dongxiao Gu, Qin Wang, Yidong Chai, Xuejie Yang, Wang Zhao, Min Li, Oleg Zolotarev, Zhengfei Xu, Gongrang Zhang. Originally published in the Journal of Medical Internet Research (https://www.jmir.org), 22.02.2024.</copyright-statement>
      <copyright-year>2024</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on https://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2024/1/e48324" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Allergic rhinitis (AR) is a chronic disease, and several risk factors predispose individuals to the condition in their daily lives, including exposure to allergens and inhalation irritants. Analyzing the potential risk factors that can trigger AR can provide reference material for individuals to use to reduce its occurrence in their daily lives. Nowadays, social media is a part of daily life, with an increasing number of people using at least 1 platform regularly. Social media enables users to share experiences among large groups of people who share the same interests and experience the same afflictions. Notably, these channels promote the ability to share health information.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aims to construct an intelligent method (TopicS-ClusterREV) for identifying the risk factors of AR based on these social media comments. The main questions were as follows: How many comments contained AR risk factor information? How many categories can these risk factors be summarized into? How do these risk factors trigger AR?</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>This study crawled all the data from May 2012 to May 2022 under the topic of <italic>allergic rhinitis</italic> on Zhihu, obtaining a total of 9628 posts and 33,747 comments. We improved the Skip-gram model to train topic-enhanced word vector representations (TopicS) and then vectorized annotated text items for training the risk factor classifier. Furthermore, cluster analysis enabled a closer look into the opinions expressed in the category, namely gaining insight into how risk factors trigger AR.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Our classifier identified more comments containing risk factors than the other classification models, with an accuracy rate of 96.1% and a recall rate of 96.3%. In general, we clustered texts containing risk factors into 28 categories, with season, region, and mites being the most common risk factors. We gained insight into the risk factors expressed in each category; for example, seasonal changes and increased temperature differences between day and night can disrupt the body’s immune system and lead to the development of allergies.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Our approach can handle large amounts of data and extract risk factors effectively. Moreover, the summary of risk factors can serve as a reference for individuals to reduce AR in their daily lives. The experimental data also provide a potential pathway that triggers AR. This finding can guide the development of management plans and interventions for AR.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>social media platforms</kwd>
        <kwd>disease risk factor identification</kwd>
        <kwd>chronic disease management</kwd>
        <kwd>topic-enhanced word embedding</kwd>
        <kwd>text mining</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>Over the past few decades, the prevalence of chronic diseases has increased significantly, becoming a global public health concern. The World Health Organization has listed allergic diseases as one of the disease types that require priority research and prevention in the 21st century [<xref ref-type="bibr" rid="ref1">1</xref>]. As a common chronic disease, allergic rhinitis (AR) is a multifactorial disease that is induced by environmental conditions or certain genes [<xref ref-type="bibr" rid="ref2">2</xref>]. AR not only has a significant impact on individuals’ sleep, social life, and work attendance but also triggers comorbidities such as conjunctivitis, atopic dermatitis, and asthma [<xref ref-type="bibr" rid="ref3">3</xref>]. Large-scale flow survey data showed that AR currently affects several people in China alone [<xref ref-type="bibr" rid="ref4">4</xref>] and has an estimated prevalence of between 15% and 20% worldwide [<xref ref-type="bibr" rid="ref5">5</xref>]. The direct and indirect costs associated with the management of AR are also a significant burden on society. For instance, the total cost of AR in Sweden, with a population of 9.5 million, was estimated at €1.3 (US $1.41) billion annually [<xref ref-type="bibr" rid="ref6">6</xref>]. These unexpectedly high costs could be related to the high prevalence of the disease, in combination with the previously often underestimated indirect costs that arise from reduced work efficiency and absenteeism and the potential costs associated with treating AR comorbidities [<xref ref-type="bibr" rid="ref6">6</xref>].</p>
        <p>Currently, there is no cure for AR, and individuals need to avoid the disease risk factors such as exposure to allergens and inhalation irritants [<xref ref-type="bibr" rid="ref7">7</xref>] during the long self-management process. Therefore, identifying AR risk factors can provide a reference for patients to help reduce the condition in their daily lives [<xref ref-type="bibr" rid="ref8">8</xref>].</p>
        <p>A plethora of studies have been proposed to identify AR risk factors. These studies recruited participants with symptoms of AR and control participants without AR symptoms from a specific age group or a particular geographical area. These studies collected demographic information, lifestyle habits, family history, comorbidities, and residential areas through questionnaires. Subsequently, they used correlation methods to explore the relationship between these data and AR, aiming to identify the risk factors for AR within the specified age group or geographical area [<xref ref-type="bibr" rid="ref9">9</xref>]. However, these studies have 2 limitations. First, these studies specifically target certain age groups or geographical areas, and questionnaires can only gather data on specific pieces of information. Owing to the constraints of questionnaire surveys, it is challenging to identify potential risk factors that may be present in individuals’ daily lives. As a result, the risk factors identified through survey-based studies have a limited scope and are incomplete. As such, they provide limited insights for a broader patient population. Second, the survey-based approach demands a commitment to long-term investigation and a substantial effort to collect representative responses [<xref ref-type="bibr" rid="ref10">10</xref>]. In contrast, collecting information from social media platforms can cover large geographical areas at a comparatively low cost [<xref ref-type="bibr" rid="ref10">10</xref>]. Social media platforms allow users to share experiences and opinions on various topics [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref12">12</xref>], including personal health issues [<xref ref-type="bibr" rid="ref13">13</xref>]. 
Over time, highly unstructured and implicit knowledge has been generated in communities where users frequently participate [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref15">15</xref>], which can provide daily health records that are difficult to obtain from traditional questionnaire surveys. Therefore, social media can become a potential source of information for identifying risk factors for diseases such as AR [<xref ref-type="bibr" rid="ref16">16</xref>].</p>
        <p>Text-mining techniques are an effective tool for using voluminous social media data [<xref ref-type="bibr" rid="ref17">17</xref>]. Some studies have combined social media data analysis to obtain knowledge about disease risk factors [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>]. However, the abovementioned studies on disease risk factors used only shallow text features such as the number of social media text items and word cooccurrences, which are not conducive to identifying disease risk factors in the context of colloquial and diverse user expressions [<xref ref-type="bibr" rid="ref20">20</xref>]. In this study, we designed a text-processing framework to automatically identify risk factors from social media data [<xref ref-type="bibr" rid="ref21">21</xref>]. We used social media comments to construct a natural language processing–based AR risk factor identification method, aiming to tackle the problems of omission and low accuracy in traditional disease-related information identification methods that rely solely on shallow text features such as word frequency.</p>
        <p>To be more specific, we developed an AR risk factor identification method that integrates pretrained word embeddings with text convolutional neural networks (CNNs). The Word2vec algorithm has proven to be superior in text vector representation [<xref ref-type="bibr" rid="ref20">20</xref>]. This is a prediction-based approach that predicts the neighboring words that are most likely to appear within a window size around a center word in a corpus, resulting in high-dimensional vector representations that capture semantic aggregation. As social media users may mention related topics, such as symptoms and treatments, when describing risk factors in their comments, we used a local context window to achieve better semantic aggregation of AR risk factors, a method that has been demonstrated to be effective for such aggregation. In addition, using the Skip-gram model to train word pairs enables the incorporation of word thematic information, thus improving attention to risk factor phrases. The convolutional network can convolve the text in the word vector dimension and extract critical information through the max-pooling layer operation. In addition, this study used a clustering method with review mechanisms to concentrate on a large amount of text that contains risk factors within the observable range, thereby ensuring the usefulness of the content obtained through text mining.</p>
        <p>Our main contributions were as follows:</p>
        <list list-type="order">
          <list-item>
            <p>First, this study proposed a framework (TopicS-ClusterREV) based on natural language processing for identifying the risk factors of AR. We used pretrained word embeddings and text convolutional networks to process social media text. Our model can identify more risk factors from social media comments with high accuracy and recall. To the best of our knowledge, this is the first study to use natural language processing techniques to identify risk factors for AR in social media comments.</p>
          </list-item>
          <list-item>
            <p>Second, this study proposes a topic-enhanced word-embedding model. TopicS enhances the thematic information of words by adding a task that predicts the theme to which the center word belongs. This generates high-dimensional word vector representations with semantic aggregation and theme enhancement. We trained 2 types of word vectors using both the Skip-gram and TopicS models and separately input them into each risk factor classifier. The results showed that TopicS outperformed the baseline on the text classification task, demonstrating the effectiveness of our topic-enhanced word-embedding model.</p>
          </list-item>
          <list-item>
            <p>Finally, we introduced automatic and manual review mechanisms to improve the single-pass algorithm, which allowed us to effectively identify and focus on a large amount of text that contains risk factors within the observable range. We ultimately identified 28 categories of risk factors including the common risk factors that lead to most individuals developing symptoms and previously overlooked risk factors that were not within the scope of previous research.</p>
          </list-item>
        </list>
      </sec>
      <sec>
        <title>Identification of AR Risk Factors Through Surveys</title>
        <p>AR has become a major global issue with a substantial increase in its prevalence in recent years. In Europe, the prevalence of AR among Danish adults progressively increased from 19% to 32% over the past 3 decades [<xref ref-type="bibr" rid="ref22">22</xref>]. Understanding the risk factors, such as genetic, environmental, and lifestyle factors, helps in the management of AR, thus motivating many studies to focus on identifying potential risk factors. These studies are summarized in <xref ref-type="table" rid="table1">Table 1</xref>. From <xref ref-type="table" rid="table1">Table 1</xref>, we observed that the previous studies were based on survey methods, including cross-sectional surveys, cohort studies, and case-control studies.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Summary of the literature related to risk factors for allergic rhinitis (AR)<sup>a</sup>.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="300"/>
            <col width="200"/>
            <col width="500"/>
            <thead>
              <tr valign="top">
                <td>Study, year</td>
                <td>Method</td>
                <td>Risk factors</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Chiang et al [<xref ref-type="bibr" rid="ref23">23</xref>], 2016</td>
                <td>Case control</td>
                <td>Exposure to sulfur dioxide</td>
              </tr>
              <tr valign="top">
                <td>Kurganskiy et al [<xref ref-type="bibr" rid="ref24">24</xref>], 2021</td>
                <td>Cross-sectional</td>
                <td>Grass and tree pollen</td>
              </tr>
              <tr valign="top">
                <td>Lee et al [<xref ref-type="bibr" rid="ref25">25</xref>], 2021</td>
                <td>Cross-sectional</td>
                <td>The widespread use of industrial chemicals</td>
              </tr>
              <tr valign="top">
                <td>Paciência et al [<xref ref-type="bibr" rid="ref26">26</xref>], 2020</td>
                <td>Cross-sectional</td>
                <td>Indoor decoration materials containing volatile organic chemicals</td>
              </tr>
              <tr valign="top">
                <td>Saulyte et al [<xref ref-type="bibr" rid="ref27">27</xref>], 2014</td>
                <td>Case control</td>
                <td>Active smoking</td>
              </tr>
              <tr valign="top">
                <td>Kong et al [<xref ref-type="bibr" rid="ref28">28</xref>], 2021</td>
                <td>Cohort</td>
                <td>Stress</td>
              </tr>
              <tr valign="top">
                <td>Han et al [<xref ref-type="bibr" rid="ref29">29</xref>], 2016</td>
                <td>Cross-sectional</td>
                <td>Obesity</td>
              </tr>
              <tr valign="top">
                <td>Kanazawa et al [<xref ref-type="bibr" rid="ref30">30</xref>], 2018</td>
                <td>Cross-sectional</td>
                <td>TYRO3 gene</td>
              </tr>
              <tr valign="top">
                <td>Alm et al [<xref ref-type="bibr" rid="ref31">31</xref>], 2014</td>
                <td>Cross-sectional</td>
                <td>Using antibiotics in the first week after birth</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>We searched for the literature related to AR risk factors and presented 9 papers from the past decade to showcase the methods and the identified risk factors.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>These studies typically recruited participants with symptoms of AR and control participants without AR symptoms from a specific age group or a particular geographical area, collected demographic information through questionnaires, and then conducted correlation analysis, such as logistic regression, to explore the relationship between these data and AR [<xref ref-type="bibr" rid="ref32">32</xref>]. For instance, Gao et al [<xref ref-type="bibr" rid="ref9">9</xref>] conducted a cross-sectional survey to investigate the prevalence and risk factors of adult self-reported AR in the plain lands and hilly areas of Shenmu City in China and analyzed the differences between regions. The content of the web-based questionnaire included demographic factors, smoking status, the comorbidities of other allergic disorders, family history of allergies, and place of residence. Unconditional logistic regression analysis was used to screen for factors influencing AR. Finally, they found regional differences in the prevalence of AR. Genetic and environmental factors were the important risk factors associated with AR. However, these studies have 2 limitations. First, these studies specifically targeted certain age groups or geographical areas, and questionnaires can only gather data on specific pieces of information. Owing to the constraints of questionnaire surveys, it is challenging to identify potential risk factors that may be present in individuals’ daily lives. As a result, the risk factors identified through survey-based studies have limited scope and are incomplete, and they may provide limited insights for a broader patient population. Second, the survey-based approach demands a commitment to long-term investigation and a massive effort to collect representative responses [<xref ref-type="bibr" rid="ref10">10</xref>].</p>
      </sec>
      <sec>
        <title>Identification of Disease Risk Factors From Social Media Through Text Mining</title>
        <p>Social media sites provide a convenient way for users to continuously update their day-to-day activities, which allows large groups of people to create and share information, opinions, and experiences about health conditions through web-based discussion [<xref ref-type="bibr" rid="ref11">11</xref>]. Hence, social media can be considered a new data source to assess population health. As shown in <xref ref-type="table" rid="table2">Table 2</xref>, some studies have combined text-mining techniques to classify and summarize voluminous social media data to obtain knowledge about chronic disease risk factors. Zhang and Ram [<xref ref-type="bibr" rid="ref33">33</xref>] extracted behavioral features from Twitter posts of asthma users using keywords from an existing knowledge base. Griffis et al [<xref ref-type="bibr" rid="ref34">34</xref>] collected 25,000 tweets that did and did not mention diabetes, identified 5000 common words, used logistic regression to determine which common words were high-frequency expressions of diabetes, and finally grouped these high-frequency words using latent Dirichlet allocation to obtain the risk factors for diabetes. Schäfer et al [<xref ref-type="bibr" rid="ref35">35</xref>] used syntactic analysis to identify portions of risk factors occurring before or after causal terms, grouped these portions using latent Dirichlet allocation, and obtained the risk factors for gastrointestinal discomfort. Pradeepa et al [<xref ref-type="bibr" rid="ref19">19</xref>] performed clustering on stroke-related tweets using the Probability Neural Network, used the Apriori algorithm to identify frequent word sets related to risk, and thus identified risk factors for stroke [<xref ref-type="bibr" rid="ref19">19</xref>]. 
In addition to the aforementioned approaches that use shallow text features such as keywords, frequent word sets, high-frequency words, and syntactic features for disease risk factor identification, other studies [<xref ref-type="bibr" rid="ref36">36</xref>-<xref ref-type="bibr" rid="ref38">38</xref>] trained risk factor classifiers using machine learning methods such as Naive Bayes, Maximum Entropy Model, and Naive Bayes Classifier–Term Frequency Inverse Document Frequency. These classifiers predict the presence of risk factors in text based on discrete vector representations such as bag-of-words and n-gram.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Summary of the literature related to disease risk factors based on social media data<sup>a</sup>.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="140"/>
            <col width="170"/>
            <col width="110"/>
            <col width="140"/>
            <col width="140"/>
            <col width="130"/>
            <col width="170"/>
            <thead>
              <tr valign="top">
                <td>Study, year</td>
                <td>Social media platforms</td>
                <td>Data</td>
                <td>Methods</td>
                <td>Features</td>
                <td>Diseases</td>
                <td>Identified risk factors</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Zhang and Ram [<xref ref-type="bibr" rid="ref33">33</xref>], 2020</td>
                <td>Twitter</td>
                <td>Posts</td>
                <td>Semisupervised learning</td>
                <td>Knowledge base</td>
                <td>Asthma</td>
                <td>Behavioral attributes</td>
              </tr>
              <tr valign="top">
                <td>Griffis et al [<xref ref-type="bibr" rid="ref34">34</xref>], 2020</td>
                <td>Twitter</td>
                <td>Posts</td>
                <td>LDA<sup>b</sup></td>
                <td>Word frequency</td>
                <td>Diabetes</td>
                <td>BMI, waist, drugs, alcohol, and obesity</td>
              </tr>
              <tr valign="top">
                <td>Schäfer et al [<xref ref-type="bibr" rid="ref35">35</xref>], 2020</td>
                <td>Doctissimo, Aufeminin</td>
                <td>Answers</td>
                <td>LDA</td>
                <td>Syntactic</td>
                <td>Gastrointestinal discomfort</td>
                <td>Food and psychological factors</td>
              </tr>
              <tr valign="top">
                <td>Pradeepa et al [<xref ref-type="bibr" rid="ref19">19</xref>], 2020</td>
                <td>Twitter</td>
                <td>Posts</td>
                <td>Apriori</td>
                <td>Frequent word set</td>
                <td>Stroke</td>
                <td>Lifestyle, family history, heart disease</td>
              </tr>
              <tr valign="top">
                <td>Alswedani et al [<xref ref-type="bibr" rid="ref39">39</xref>]</td>
                <td>Twitter</td>
                <td>Posts</td>
                <td>Keywords list</td>
                <td>Word frequency</td>
                <td>Psychological health</td>
                <td>Social and economic factors, individual factors, diseases and disorders</td>
              </tr>
              <tr valign="top">
                <td>Chung et al [<xref ref-type="bibr" rid="ref40">40</xref>]</td>
                <td>Telegram (app)</td>
                <td>Time</td>
                <td>MLP<sup>c</sup></td>
                <td>Metadata</td>
                <td>Respiratory diseases</td>
                <td>Pollution</td>
              </tr>
              <tr valign="top">
                <td>Neisani Samani et al [<xref ref-type="bibr" rid="ref41">41</xref>]</td>
                <td>Twitter</td>
                <td>Posts</td>
                <td>Content analysis methods</td>
                <td>Word frequency</td>
                <td>Oropharyngeal cancer</td>
                <td>Drinking, smoking</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>We searched for studies related to identifying disease risk factors based on social media data. We found 7 papers from the past decade, highlighting the social media platforms, data, methods, features, diseases, and risk factors involved in research.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>LDA: latent Dirichlet allocation.</p>
            </fn>
            <fn id="table2fn3">
              <p><sup>c</sup>MLP: multilayer perceptron.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>The current methods for identifying disease risk factors on social media fall into 2 categories: shallow text feature methods and discrete word vector representations. Shallow text feature techniques often fail to capture important risk factors, resulting in low accuracy, whereas discrete word vector approaches struggle to keep up with the dynamic vocabulary of social media text, missing new words and trending expressions and thus inadequately representing the information conveyed.</p>
      </sec>
      <sec>
        <title>Word Embedding and Text Classification Based on Deep Learning</title>
        <p>Natural language processing technology promotes text analysis based on social media comments [<xref ref-type="bibr" rid="ref39">39</xref>]; this technology can learn the deeper semantic features of the comment text and the features that are consistent with the current context, according to different training corpora, to input a better text vector representation for downstream classification tasks. Some researchers have used large-scale pretrained language models [<xref ref-type="bibr" rid="ref40">40</xref>], global matrix decomposition [<xref ref-type="bibr" rid="ref41">41</xref>], and local context windows [<xref ref-type="bibr" rid="ref42">42</xref>] for text vector representation. Local context windows are more suitable for semantically aggregating AR risk factors [<xref ref-type="bibr" rid="ref43">43</xref>]. Skip-gram and Continuous Bag-of-Words Model (CBOW) are prediction-based methods that learn the semantic representation of a center word by predicting the most likely neighboring words within a window size in a corpus. When users narrate risk factors in their comments, they may also mention symptoms, treatments, and other topics. These global contexts may dilute the key features of the risk factor expression. CBOW averages the context words to predict the target word and tends to predict high-frequency words in the corpus. In contrast, Skip-gram gives each word a chance to be a center word, making it better at predicting rare words compared with CBOW [<xref ref-type="bibr" rid="ref44">44</xref>]. Therefore, in situations where social media users express a wide variety of ideas, the Skip-gram model can yield satisfactory outcomes. Moreover, the Skip-gram approach uses word pair training, which facilitates the incorporation of topic information into words [<xref ref-type="bibr" rid="ref45">45</xref>], resulting in the generation of high-dimensional word vectors that feature semantic aggregation and topic enhancement. Therefore, we selected Skip-gram as the word-embedding model for our study.</p>
        <p>Text classification has evolved to deep learning models, mainly including CNN-based models [<xref ref-type="bibr" rid="ref46">46</xref>], recurrent neural network (RNN)–based models [<xref ref-type="bibr" rid="ref47">47</xref>], and transformer models [<xref ref-type="bibr" rid="ref48">48</xref>]. For the CNN algorithm, convolutional networks can convolve text on the word vector dimensions and extract key information through pooling layer operations. Consequently, this algorithm is capable of using essential data for classification tasks. Therefore, we used TextCNN for classifier training and evaluated the performance of RNN and transformer models on this task.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Framework</title>
        <p>The framework used in this study consisted of 3 parts as shown in <xref rid="figure1" ref-type="fig">Figure 1</xref>. The first part was data collection and processing, aimed at obtaining a clean data set. The second part was risk factor identification, which included the proposed TopicS method and training of a risk factor classifier. The implementation steps were as follows: (1) semiautomatically constructing a risk factor topic dictionary, (2) generating high-dimensional word vectors enhanced by TopicS-generated topics, and (3) vectorizing annotated text and training a risk factor classifier. The third part is text clustering and keyword extraction, which uses the ClusterREV method to cluster the identified risk factors and extract keywords from every category.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Allergic rhinitis (AR) risk factor identification method based on the topic-enhanced word-embedding model (TopicS-ClusterREV). The figure shows the research framework of our study. The framework consists of 3 parts. The first part is data collection and processing aimed at obtaining a clean data set. The second part is risk factor identification, which includes the proposed TopicS method and training of a risk factor classifier. The third part is text clustering and keyword extraction, which uses the ClusterREV method to cluster identified risk factors and extract keywords from every category.</p>
          </caption>
          <graphic xlink:href="jmir_v26i1e48324_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Data Set</title>
        <p>Zhihu is a Chinese social media platform where people discuss topics in a web-based forum format. In May 2022, the Zhihu subcommunity <italic>allergic rhinitis</italic> had 1.04 million discussions. The posts on this social media platform allow other users to comment [<xref ref-type="bibr" rid="ref49">49</xref>], and people can explain their situations to provide support or seek help effectively. Therefore, these comments provide a rich source of data for investigating the risk factors reported by different users [<xref ref-type="bibr" rid="ref50">50</xref>]. In this study, we trained domain-specific word representations based on experimental data. A relatively domain-specific input corpus [<xref ref-type="bibr" rid="ref51">51</xref>] is better at extracting meaningful semantic relations than a generic pretrained language model [<xref ref-type="bibr" rid="ref52">52</xref>]. We crawled all the data from May 2012 to May 2022 under the topic <italic>allergic rhinitis</italic> on Zhihu, obtaining a total of 9628 posts and 33,747 comments, including the post ID, comment ID, and post and comment content.</p>
        <p>In this study, we preprocessed the data through regularization, stop word removal, and word separation. First, we removed special symbols, such as URLs and emoticons, in the comments through regularization and stop word removal to reduce the interference of noise with the text analysis task. Then, we compiled a dictionary of 169 specialized terms, including types of AR, medications, and comorbidities, to reduce the probability of incorrect word segmentation. After word separation, we obtained a lexicon of 68,863 words and ranked the words according to the number of occurrences. We found that the top 10,000 words accounted for 94.83% of the total words, suggesting that many words recurred and a relatively simple word vector could effectively train the model [<xref ref-type="bibr" rid="ref53">53</xref>]. This further confirms the efficacy of our decision to use Skip-gram as the foundational model.</p>
        <p>We observed ultrashort comment noise in the comments (eg, “Thank you!”). It is important to note that these ultrashort comments do not include any personal medical information. The ultrashort comments were filtered, resulting in 33,039 valid comments. This operation can effectively minimize the impact of noise on downstream text classification tasks. Table S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> presents the examples of valid comments.</p>
      </sec>
      <sec>
        <title>Annotation</title>
        <p>The data must be labeled before supervised learning and then trained end to end. If a comment directly mentions an allergen or indicates a condition that leads to the appearance or worsening of symptoms, the comment will be labeled as 1, indicating the presence of risk factors, as shown in <xref rid="figure2" ref-type="fig">Figure 2</xref>.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Examples of short text annotation. The figure shows examples of data labeled as 1 including the text and label. In the figure, phrases with a blue background indicate those that were specifically noted during manual annotation, and the presence of these marker phrases often suggests potential risk factors in the sentence. The yellow background highlights the risk factors in the text.</p>
          </caption>
          <graphic xlink:href="jmir_v26i1e48324_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>We randomly chose 2030 comments from the 33,039 comments, and 3 researchers labeled each comment as containing or not containing risk factors. To ensure high interannotator consistency, all 3 researchers annotated all 2030 comments. In cases with uncertainty in labeling, the 3 researchers discussed and arrived at a final label. After annotating and eliminating comments with religiously controversial content, 2000 labeled comments remained, consisting of 996 comments containing risk factors and 1004 comments not containing risk factors. The data set was divided into a 90% training set and a 10% test set. The 90% training set was further divided into 10 subsets, with 9 subsets used for training and the remaining subset used for validation, performing 10-fold cross-validation.</p>
      </sec>
      <sec>
        <title>Topic Dictionary Construction</title>
        <p>We used a combination of manual labeling and similarity calculation to identify keywords related to risk factors. Subsequently, we constructed a table of topic words using a semiautomated approach. The process of constructing the dictionary is depicted in <xref ref-type="boxed-text" rid="box1">Textbox 1</xref> and is as follows: (1) label 400 randomly selected comments as described in the <italic>Annotation</italic> section, thereby obtaining 198 comments with risk factors; (2) extract risk factor phrases from annotated comments; (3) obtain the risk factor topic word list; (4) remove duplicates from the word list and use the words in the current topic as seed words, <italic>word_set</italic>; (5) use Skip-gram to find the top similar words to expand the topic words; (6) repeat steps 3 through 5 to further expand the topic words; and (7) finally, obtain the topic words for the risk factor. A large weight was assigned to the risk factor theme words. Table S2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> shows examples of the risk factor topic dictionary.</p>
        <boxed-text id="box1" position="float">
          <title>The algorithm for building the topic dictionary. This textbox outlines the algorithm process for building the topic dictionary with explanations for each step provided in the text.</title>
          <p>Input: annotated comments</p>
          <p>Output: topic dictionary</p>
          <p>1. d<sup>i</sup>= Select Annotated data;</p>
          <p>2. p<sup>i</sup>= Extract from d<sup>i</sup></p>
          <p>3. list = []</p>
          <p>for w in p<sup>i</sup>:</p>
          <p>list.append(w)</p>
          <p>4. word_set=set(list)</p>
          <p>5. for w in word_set: word_i.update(Skip-gram.mostsimilar(w, topn=n))</p>
          <p>6. Loop step3, step4, step5</p>
        </boxed-text>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>As the use of text data from social media involves user privacy, this study adopted the following steps for deidentification: (1) We removed user account information and retained only anonymous comment information. (2) We used regular expressions to match and delete URLs and email addresses in the comments. (3) During the annotation process, annotators received only text that did not involve personal information. To evaluate the quality of deidentification, we randomly selected 500 text items for manual inspection and did not find any instances containing personal identity information. Our data are sourced from public discussions on Zhihu, a social media platform that can be accessed without registration. We followed strict ethical research protocols similar to the guidelines by Eysenbach and Till [<xref ref-type="bibr" rid="ref54">54</xref>]. In addition, to protect the anonymity of participants, we have implemented measures including the removal of user information and avoiding verbatim quotations to prevent identification through search engines, protecting the privacy and security of personal data. It should be mentioned that our study was focused on the post level; we do not anticipate any negative ethical impact from our analysis.</p>
      </sec>
      <sec>
        <title>Topic-Enhanced Word Embedding</title>
        <p>TopicS performed 2 tasks during training, as shown in <xref rid="figure3" ref-type="fig">Figure 3</xref>. The first task was to predict the neighboring words within the window of the central word. The second task was to predict the topic of the central word; the topic dictionary used for this purpose is described in the <italic>Topic Dictionary Construction</italic> section.</p>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Topic-enhanced word-embedding model (TopicS). The figure illustrates the vector changes within the TopicS model. The rectangular boxes in both the input and output represent one-hot vectors. Within the input, the dark blue circles signify the center words, representing a value of 1, whereas the light blue circles denote other words in the training text, with a value of 0. For the output’s task 1, the dark blue circles depict context words surrounding the center word, signifying a value of 1, whereas the light blue circles represent noncontext words with a value of 0. The various colored circles in the output’s task 2 indicate the topics to which the center word belongs. If it pertains to the risk factor topic, it is marked by a dark blue circle, symbolizing a value of 1, whereas circles of other colors represent a value of 0.</p>
          </caption>
          <graphic xlink:href="jmir_v26i1e48324_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>The specific formula calculations for the loss function design, parameter updates, and error backpropagation of TopicS are explained subsequently.</p>
        <p>First, we defined the loss function. For each word in the corpus, we used it as the central word for a sliding operation with a window size of <italic>c</italic>; let <italic>S</italic> be the training sequence (<italic>w<sub>1</sub>,w<sub>2</sub>,...,w<sub>T</sub></italic>), where <italic>w<sub>i</sub></italic> denotes the <italic>i</italic>th word in the sequence. The subscript <italic>T</italic> represents the total number of unique words in the corpus. In addition to predicting the contextual words of the central word, we must also predict the topic score of the central word. Therefore, the loss function comprised 2 parts: <italic>L<sub>cont</sub></italic> and <italic>L<sub>topic</sub></italic>, and the overall loss was denoted by <italic>L<sub>s</sub></italic>. Our training objective was to minimize the loss function:</p>
        <disp-formula>
          <graphic xlink:href="jmir_v26i1e48324_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </disp-formula>
        <p>The initial word vector was represented as a one-hot vector. The central word was denoted as <italic>w<sub>center</sub></italic>, the surrounding words of the central word were denoted as <italic>w<sub>(O,cont(i))</sub></italic>, and the central word topic information was denoted as <italic>w<sub>(O,topic)</sub></italic>. The weight parameter <italic>λ</italic> was used to balance the loss of <italic>L<sub>cont</sub></italic> and <italic>L<sub>topic</sub></italic>. After sliding the window over the entire corpus and averaging the losses of all windows, error backpropagation was performed to update the parameters. The input matrix was represented as the central word vector. The actual loss function can be expressed as <graphic xlink:href="jmir_v26i1e48324_fig7.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/></p>
        <p>Second, we introduced the rules for updating parameters. The parameters were updated through error backpropagation <graphic xlink:href="jmir_v26i1e48324_fig8.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/> Here, <italic>y<sub>true</sub></italic> represents the true value of the contextual words in the window, and <italic>y<sub>pred</sub></italic> represents the predicted value.</p>
        <p>Finally, we can update the word representation.</p>
      </sec>
      <sec>
        <title>Text Classification</title>
        <p>In this study, we chose TextCNN as the classification model. In the risk factor identification task, some key semantic information is more important, and TextCNN can efficiently use the key information for classification with minimal cost consumption. We represented the manually annotated text as a vector matrix using high-dimensional word vector representations trained by the TopicS model, which aggregates local contextual and topic information and uses it as input for the TextCNN model. Then, the TextCNN algorithm leverages convolutional kernels of different sizes to extract multiple n-gram text features and uses convolutional operations in a fixed window to combine word representations to capture local information. Our input word vector combined the topic information of words, and the most important features in the convolution operation can be extracted using the maximum pooling operation as shown in <xref rid="figure4" ref-type="fig">Figure 4</xref>.</p>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Framework of the classification model with different word embeddings. This figure illustrates the TextCNN modeling process for text vectorization using both the Skip-gram and TopicS techniques. In the example sentence, “spring” and “pollen” are highlighted as risk factors. These words are represented by blue squares in TopicS, suggesting that TopicS incorporates topic information, unlike the Skip-gram method. These thematic data are subsequently integrated into the convolution, max-pooling, and softmax procedures to enhance the model’s classification capabilities.</p>
          </caption>
          <graphic xlink:href="jmir_v26i1e48324_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Clustering With a Review Mechanism</title>
        <p>The clustering task is to group similar risk factors. In this study, a large amount of text containing risk factors was clustered into a manually observable number of categories, making it easier to comprehend their content. This study enhances the single-pass algorithm and integrates it with a manual review to cluster the risk factors identified in the text classification, ensuring the validity of the clustering results. The main concept of single-pass clustering [<xref ref-type="bibr" rid="ref55">55</xref>] is to match informational text items based on their similarity values without the need to determine the number of clusters in advance. This makes it suitable for clustering tasks with an unknown number of clusters. However, traditional single-pass clustering uses only one-loop traversal, which may result in previously entered text items completing the traversal earlier. This can cause their similarity to the previous topics to be slightly lower than the threshold and lead to them being recreated as new categories, ultimately affecting the clustering effect.</p>
        <p>As shown in <xref rid="figure5" ref-type="fig">Figure 5</xref>, we improved the single-pass algorithm by retraversing the categories that were clustered separately after all the text items had been traversed to handle any missed text. After the automated clustering was completed, we conducted a manual review to ensure the reliability of the clustering.</p>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>Cluster method with review mechanisms (ClusterREV). This figure depicts the process of the ClusterREV algorithm. The rectangular boxes represent category state transitions. The circles below the rectangles indicate the texts awaiting clustering. The algorithm assesses the distance between the current text and existing categories, classifying the text based on the minimal distance and a set threshold. Once all texts have been clustered, texts within a solitary category undergo automatic review. Finally, we manually reviewed the clustering results.</p>
          </caption>
          <graphic xlink:href="jmir_v26i1e48324_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>Moreover, this study uses a keyword cloud visualization of category content to quickly understand the themes and characteristics of each cluster and compare the differences between different clusters. TextRank [<xref ref-type="bibr" rid="ref56">56</xref>] was selected to extract category keywords, which considers only the voting scores of words in a single document; common words that frequently appear in a single document easily obtain high scores [<xref ref-type="bibr" rid="ref57">57</xref>]. We treated each category as a single document for keyword extraction. As risk factors appear more frequently in categories, TextRank can effectively extract risk factors and surrounding words, preserving category content information as much as possible and reflecting the true content of the risk factors.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Overview</title>
        <p>In this section, we present the performance of the classifier and the findings based on the categorization of all the comments in the clean data set using the classifier. Our approach involved visualizing the clustering results of the risk factors to comprehend the primary elements of these factors. We also explored the pathogenic mechanisms associated with these risk factors.</p>
      </sec>
      <sec>
        <title>Classifier Performance</title>
        <p>We used standard text-mining evaluation metrics such as accuracy, precision, recall, and <italic>F</italic><sub>1</sub>-score to evaluate the performance. Precision assesses how many risk factors the model identifies correctly, and recall measures how many risk factors the model can identify on its test set. As we aimed to identify as many AR risk factors as possible to provide comprehensive references for individuals, recall was more important than precision in our study.</p>
        <p>We set 7 word-embedding dimensions ranging from 100 to 400. <xref ref-type="table" rid="table3">Table 3</xref> displays the classification results of the TextCNN classification model with the 7 dimensions of Skip-gram and TopicS word vectors. In addition, TextRNN and transformer models were evaluated with the 7 word-embedding dimensions of TopicS or Skip-gram, as shown in Tables S3 and S4 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>; the classification models performed better when the word-embedding dimension was 100 or 150, as shown in <xref ref-type="table" rid="table4">Table 4</xref>, which includes the results with best-performing dimensions. This study conducted word representation learning on a domain-specific input corpus, where low dimensionality was found to be sufficient to represent the features of the corpus [<xref ref-type="bibr" rid="ref58">58</xref>]. Moreover, TopicS not only improved precision but also significantly increased recall for all 3 models, as shown in <xref ref-type="table" rid="table4">Table 4</xref>.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Word-embedding dimension parameters with TextCNN.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="130"/>
            <col width="0"/>
            <col width="130"/>
            <col width="0"/>
            <col width="130"/>
            <col width="0"/>
            <col width="120"/>
            <col width="0"/>
            <col width="120"/>
            <col width="0"/>
            <col width="120"/>
            <col width="0"/>
            <col width="120"/>
            <col width="0"/>
            <col width="100"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Evaluation metrics and model</td>
                <td colspan="2">100</td>
                <td colspan="2">150</td>
                <td>200</td>
                <td colspan="3">250</td>
                <td colspan="2">300</td>
                <td colspan="2">350</td>
                <td>400</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="16">Accuracy (%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Skip-gram</td>
                <td colspan="2">93.75</td>
                <td colspan="2">94.85</td>
                <td colspan="3">94.00</td>
                <td>93.15</td>
                <td colspan="2">93.80</td>
                <td colspan="2">93.49</td>
                <td colspan="2">93.40</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>TopicS<sup>a</sup></td>
                <td colspan="2">95.10<sup>b</sup></td>
                <td colspan="2">96.10</td>
                <td colspan="3">94.80</td>
                <td>94.45</td>
                <td colspan="2">94.95</td>
                <td colspan="2">95.25</td>
                <td colspan="2">95.40</td>
              </tr>
              <tr valign="top">
                <td colspan="16">Precision (%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Skip-gram</td>
                <td colspan="2">91.92</td>
                <td colspan="2">95.32</td>
                <td colspan="3">94.07</td>
                <td>93.16</td>
                <td colspan="2">93.33</td>
                <td colspan="2">93.28</td>
                <td colspan="2">93.09</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>TopicS</td>
                <td colspan="2">96.32</td>
                <td colspan="2">95.95</td>
                <td colspan="3">95.56</td>
                <td>94.11</td>
                <td colspan="2">95.20</td>
                <td colspan="2">95.87</td>
                <td colspan="2">96.53</td>
              </tr>
              <tr valign="top">
                <td colspan="16">Recall (%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Skip-gram</td>
                <td colspan="2">94.00</td>
                <td colspan="2">94.50</td>
                <td colspan="3">94.00</td>
                <td>93.30</td>
                <td colspan="2">94.40</td>
                <td colspan="2">93.90</td>
                <td colspan="2">93.90</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>TopicS</td>
                <td colspan="2">95.90</td>
                <td colspan="2">96.30</td>
                <td colspan="3">94.00</td>
                <td>94.90</td>
                <td colspan="2">94.70</td>
                <td colspan="2">94.60</td>
                <td colspan="2">94.20</td>
              </tr>
              <tr valign="top">
                <td colspan="16"><italic>F</italic><sub>1</sub>-score (%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Skip-gram</td>
                <td colspan="2">93.90</td>
                <td colspan="2">94.88</td>
                <td colspan="3">93.95</td>
                <td>93.17</td>
                <td colspan="2">93.84</td>
                <td colspan="2">93.48</td>
                <td colspan="2">93.44</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>TopicS</td>
                <td colspan="2">95.09</td>
                <td colspan="2">96.10</td>
                <td colspan="3">94.77</td>
                <td>94.48</td>
                <td colspan="2">94.94</td>
                <td colspan="2">95.22</td>
                <td colspan="2">95.34</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>TopicS represents the topic-enhanced word-embedding model proposed in this paper.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>Italicization represents that the metrics of TopicS are better than Skip-gram for each metric.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Accuracy, precision, recall, and <italic>F</italic><sub>1</sub>-score of Skip-gram and TopicS with different classification models.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="200"/>
            <col width="0"/>
            <col width="160"/>
            <col width="0"/>
            <col width="160"/>
            <col width="0"/>
            <col width="150"/>
            <col width="150"/>
            <col width="0"/>
            <col width="150"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Model (Embed_size<sup>a</sup>)</td>
                <td colspan="2">Accuracy (%)</td>
                <td colspan="2">Precision (%)</td>
                <td>Recall (%)</td>
                <td colspan="2"><italic>F</italic><sub>1</sub>-score (%)</td>
                <td>Time (s)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="11">TextCNN</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Skip-gram (150 dimens)</td>
                <td colspan="2">94.85</td>
                <td colspan="2">95.32</td>
                <td colspan="2">94.50</td>
                <td>94.88</td>
                <td colspan="2">40.30</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>TopicS (150 dimens)</td>
                <td colspan="2">96.10<sup>b</sup></td>
                <td colspan="2">95.94</td>
                <td colspan="2">96.30</td>
                <td>96.10</td>
                <td colspan="2">35.23</td>
              </tr>
              <tr valign="top">
                <td colspan="11">TextRNN</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Skip-gram (150 dimens)</td>
                <td colspan="2">94.85</td>
                <td colspan="2">95.32</td>
                <td colspan="2">94.50</td>
                <td>94.88</td>
                <td colspan="2">40.30</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>TopicS (150 dimens)</td>
                <td colspan="2">96.10<sup>b</sup></td>
                <td colspan="2">95.94</td>
                <td colspan="2">96.30</td>
                <td>96.10</td>
                <td colspan="2">35.23</td>
              </tr>
              <tr valign="top">
                <td colspan="11">Transformer</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Skip-gram (100 dimens)</td>
                <td colspan="2">85.45</td>
                <td colspan="2">85.06</td>
                <td colspan="2">78.80</td>
                <td>81.13</td>
                <td colspan="2">55.16</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>TopicS (150 dimens)</td>
                <td colspan="2">90.70</td>
                <td colspan="2">90.90</td>
                <td colspan="2">90.60</td>
                <td>90.68</td>
                <td colspan="2">49.32</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup>Embed_size represents the word-embedding size.</p>
            </fn>
            <fn id="table4fn2">
              <p><sup>b</sup>Italicization represents that the metrics of TopicS are better than Skip-gram for each model.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p><xref ref-type="table" rid="table4">Table 4</xref> shows that TextCNN has the highest accuracy and recall rate among the 3 classification models. The highest accuracy achieved by our classification model was 0.9594, which used a 150-dimension word-embedding representation obtained from TopicS. In other words, TextCNN can detect more risk factors and minimize the loss of risk factors resulting from classification errors. The CNN model can extract key information similar to n-grams in sentences. The combination of TopicS and TextCNN can enhance topic information and achieve an aggregation effect. Our implementation process was the simplest and consumed the least resources. Our model examined 30,372 comments and identified 5221 comments containing risk factors.</p>
      </sec>
      <sec>
        <title>Risk Factor Clustering Results</title>
        <p>We clustered the text items obtained from the text classification into 28 categories and extracted keywords from each category to better understand the content. <xref ref-type="table" rid="table5">Table 5</xref> shows the top 5 categories and their corresponding keywords. The complete list can be found in Table S5 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. We used category 1 as an example to explain the category formation process and demonstrate the validity of the qualitative results. As shown in <xref ref-type="table" rid="table5">Table 5</xref>, we labeled category 1 as <italic>Season</italic> based on the analysis of keyword weights and related comments. The comments related to this category focused on seasonally induced AR, with factors such as changes in the weather during seasonal transitions and colder temperatures during winter, which can exacerbate symptoms. We also counted the number of text items in each category and found that seasonal, regional, mites, and weather changes were common risk factors for most patients. In addition, patients’ unhealthy lifestyle habits were also important risk factors widely present in research investigations. Furthermore, most patients reported experiencing symptoms at specific times (eg, “morning”), but researchers have paid little attention to the timing of symptom occurrence (which we refer to as time points).</p>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Category keyword distribution and visualization.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="117"/>
            <col width="605"/>
            <col width="145"/>
            <col width="133"/>
            <thead>
              <tr valign="top">
                <td>Category</td>
                <td>Top 10 words (weight)</td>
                <td>Word cloud</td>
                <td>Number of text items</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Season</td>
                <td>Summer (0.031), winter (0.031), season (0.02), season change (0.014), spring (0.013), autumn (0.013), seasonal (0.013), nose (0.011), air conditioning (0.01), month (0.007)</td>
                <td>
                  <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>
                </td>
                <td>852</td>
              </tr>
              <tr valign="top">
                <td>Region</td>
                <td>Beijing (0.035), Shenzhen (0.019), air (0.010), Wuhan (0.010), Guangdong (0.01), city (0.009), Shanghai (0.009), dust mites (0.009), nose (0.009), university (0.009)</td>
                <td>
                  <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>
                </td>
                <td>644</td>
              </tr>
              <tr valign="top">
                <td>Mites</td>
                <td>Dust mites (0.111), mites (0.045), dust (0.02), allergy (0.012), pollen (0.008), allergens (0.007), effect (0.006), child (0.005), nose (0.005), cold air (0.005)</td>
                <td>
                  <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>
                </td>
                <td>608</td>
              </tr>
              <tr valign="top">
                <td>Weather</td>
                <td>Cold air (0.071), weather (0.023), temperature (0.021), nose (0.02), winter (0.009), changes (0.008), air (0.008), alternate (0.008), summer (0.007), air conditioning (0.007)</td>
                <td>
                  <xref ref-type="supplementary-material" rid="app5">Multimedia Appendix 5</xref>
                </td>
                <td>538</td>
              </tr>
              <tr valign="top">
                <td>Other diseases</td>
                <td>Cold and flu (0.095), conjunctivitis (0.019), urticaria (0.016), nose (0.01), asthma (0.009), cough (0.008), eczema (0.008), winter (0.004), eyes (0.004), physique (0.004)</td>
                <td>
                  <xref ref-type="supplementary-material" rid="app6">Multimedia Appendix 6</xref>
                </td>
                <td>372</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Possible Pathways by Which Several Risk Factors Trigger AR</title>
        <p>We referred to the relevant literature on the risk factors associated with AR to confirm whether the extracted risk factors were consistent with the general medical consensus. Our findings are novel compared with those in the literature [<xref ref-type="bibr" rid="ref59">59</xref>]. Previous survey-based studies have explored only the correlation between risk factors and AR, whereas our experimental data provide insight into the potential pathogenesis of reported risk factors. The following section provides a theoretical discussion of potential pathways for several risk factors that trigger AR:</p>
        <list list-type="bullet">
          <list-item>
            <p><italic>Season</italic>: (1) seasonal risk factors are manifested in pollen allergens. Tree allergens such as elm and cypress pollen are prevalent in early spring, followed by ash, pine, and birch pollen in late spring. In summer, grasses, artemisia, and flowering plants grow vigorously owing to increased rainfall, leading to increased pollen spread from these plants. In autumn, weeds account for the largest proportion of pollen allergens. (2) Different climatic conditions in different seasons contribute to the development of allergies. For example, in early spring, frequent cold and high-pressure air activity in East Asia causes intense atmospheric circulation, resulting in alternating hot and cold temperatures that impair the immune regulatory function of the human body, leading to increased allergy attacks. In autumn, changeable weather, large temperature differences, and sunlight and UV radiation can stimulate allergic reactions in people with weak lungs or those who are prone to AR. In addition, seasonal changes and increasing temperature differences between day and night can disrupt the human immune system.</p>
          </list-item>
          <list-item>
            <p><italic>Poor habits</italic>: major keywords for this topic were “smoking,” “staying up late,” and “resistance.” (1) Habits such as staying up late, lack of exercise, smoking, and alcohol abuse can weaken immunity and resistance. Gangl et al [<xref ref-type="bibr" rid="ref60">60</xref>] found that smoking can reduce the integrity and barrier function of respiratory epithelial cells, thereby making smokers more susceptible to allergens. (2) An irregular diet can damage the spleen and stomach, which is also a key factor in the development of AR. (3) The frequent use of air conditioning in summer can cause nasal mucosa irritation owing to temperature fluctuations. Long-term exposure to adverse stimuli can cause dryness of the nasal cavity and weaken the resistance of the mucosal epithelium, which may lead to AR.</p>
          </list-item>
          <list-item>
            <p><italic>Allergens</italic>: we grouped clusters that included mites, plants, food, animals, and mold as allergens. (1) The findings of this study suggest that dust mites are the primary allergen, and exposure to a certain concentration of indoor dust mites can lead to AR. The ideal humidity level for dust mite growth is between 75% and 80%, and dust mites tend to thrive during spring and autumn and in warm and humid environments. Studies have shown that a large number of dust mites may be attached to uncleaned air conditioning filters, confirming that air conditioning is an important route of transmission for household dust mites [<xref ref-type="bibr" rid="ref61">61</xref>]. (2) Allergenic pollen species are closely related to regions and seasons, and some regions now provide pollen concentration and allergy index broadcasts based on meteorological conditions, which is highly convenient for individuals experiencing allergy. (3) Food allergens such as milk, eggs, wheat, soybeans, and peanuts can also trigger AR. (4) Apart from dust mites, other perennial indoor allergens include animal dander, cockroach excrement, and molds.</p>
          </list-item>
          <list-item>
            <p><italic>Outdoor environment</italic>: this topic had “dust,” “air quality,” “trust,” and “allergen” as high scoring words. (1) Various substances present in the outdoor environment can trigger AR. Industrialization has increased the content of aromatic hydrocarbon particles, ethanol, and formaldehyde in diesel exhaust, which can damage the mucous membrane and serve as a strong stimulus for AR attacks. (2) Air pollution can affect the distribution of allergens such as mold and pollen. In hazy weather, allergens tend to stay in the air longer, increasing the chance and duration of contact with the human body and leading to AR. (3) High winds can raise dust, pollen, mites, bacteria, and other allergenic factors, increasing their concentration in the air and making it easier to trigger AR.</p>
          </list-item>
          <list-item>
            <p><italic>Time points</italic>: patients with AR are more likely to experience symptoms during 2 specific time points, morning and evening. Schenkel et al [<xref ref-type="bibr" rid="ref62">62</xref>] assessed the severity of 4 nasal symptoms (sneezing, blockage, runny nose, and nasal itch) at different times of the day, revealing that morning and evening symptoms were the most severe. This may be because of the circadian rhythm, pollen concentration, or personal behavior exacerbating the symptoms. In the evening, when the wind subsides, pollen settles closer to the ground and can be inhaled more easily. In addition, because humans rest at night in a horizontal position, nasal ventilation may be more difficult, leading to more severe symptoms. In the morning, low temperatures can cause congestion and swelling of the nasal mucosa because of the temperature difference between the environment and the body. This cluster had words such as “evening,” “get up early,” and “nose” as highly rated words.</p>
          </list-item>
        </list>
        <p>This theoretical discussion regarding the potential pathway of risk factors that trigger AR can guide the development of detailed AR intervention measures. For example, patients with AR can pay attention to pollen concentration and temperature changes and adjust their outings and clothing accordingly based on the characteristics of the season; they can set the air conditioner to turn on or off based on their waking time to reduce the inhalation of cold air when waking up. Furthermore, they can adjust their sleeping position to reduce the frequency of nighttime symptoms.</p>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>This study aimed to identify the risk factors for AR based on social media comments. To do so, a data set of comments related to AR was collected, processed, and analyzed. The data set covered a consecutive period from May 2012 to May 2022. Overall, this analysis provided new insights into three main questions: (1) How many comments contained AR risk factor information? (2) How many categories can these risk factors be summarized into? (3) How do these risk factors trigger AR?</p>
        <p>In assessing the identification of AR risk factors, we found that TopicS enhanced both precision and recall. TextCNN outperformed other models, achieving an accuracy of 0.9594 with a 150-dimension TopicS embedding. Analyzing 30,372 comments, our model pinpointed 5221 comments with risk factors. Categorizing the text items led to 28 distinct categories, with seasonal factors, regional variations, mites, weather changes, and unhealthy lifestyle habits emerging as common risks.</p>
        <p>Furthermore, our research into AR risk factors revealed how these risk factors trigger AR and uncovered risk factors that are frequently reported by affected individuals but remain underresearched. Seasonal changes, especially during spring and autumn, increase exposure to pollen allergens, with varying climatic conditions affecting the development of allergies. Poor habits, such as smoking, irregular sleep, and frequent use of air conditioning, compromise immunity and heighten AR susceptibility. Dust mites, influenced by humidity, stand out as a primary allergen, with food items and indoor factors, such as animal dander, also triggering AR. Industrial pollutants and outdoor environmental factors amplify AR risk. Notably, AR symptoms intensify during mornings and evenings, which is likely influenced by circadian rhythms and environmental factors.</p>
      </sec>
      <sec>
        <title>Limitations and Future Work</title>
        <p>This study has some limitations. Our study relied on self-reported social media data, and the lack of more detailed information about the study participants was a concern. Our statistics showed that seasonal factors, regional variations, mites, weather changes, and unhealthy lifestyle habits emerge as common risk factors, which is consistent with the findings of other studies based on surveys. Although social media may lack in-depth patient information, it provides an effective method of collecting breadth of data. Social media data can be gathered 24 hours a day and are an extremely efficient way to rapidly update new knowledge into the risk factor knowledge base. In the future, our framework can be expanded in 2 ways. First, the framework can track the development trends and changes in AR risk factors by leveraging real-time internet data sets. Second, the framework can be generalized and extended to detect patterns, trends, and risk factors for other chronic diseases such as type 2 diabetes.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>In this model improvement study, we proposed a topic-enhanced word-embedding model to improve the accuracy and recall of the text classification, namely to uncover less common or other types of risk factors based on social media data that have not been previously reported. The risk factors identified in this study can be a helpful reference for people with AR to reduce the development of the disease in their daily lives. This study establishes a knowledge base of potential risk factors for individuals who may not be aware of the factors that could trigger their symptoms. Patients can compare their lifestyle habits and medical history to identify their risk factors, which could help reduce the frequency of episodes and prevent the decline in their quality of life caused by blindly avoiding potential triggers. Our findings demonstrate the practicality and feasibility of using social media data for investigating disease knowledge. These findings may provide guidance for the development of management plans and interventions for AR.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Examples of social media text, topic dictionary examples, word-embedding dimension parameters with TextRNN, word-embedding dimension parameters with Transformer, and social media category distribution and visualization.</p>
        <media xlink:href="jmir_v26i1e48324_app1.docx" xlink:title="DOCX File , 693 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Word cloud 1.</p>
        <media xlink:href="jmir_v26i1e48324_app2.png" xlink:title="PNG File , 119 KB"/>
      </supplementary-material>
      <supplementary-material id="app3">
        <label>Multimedia Appendix 3</label>
        <p>Word cloud 2.</p>
        <media xlink:href="jmir_v26i1e48324_app3.png" xlink:title="PNG File , 120 KB"/>
      </supplementary-material>
      <supplementary-material id="app4">
        <label>Multimedia Appendix 4</label>
        <p>Word cloud 3.</p>
        <media xlink:href="jmir_v26i1e48324_app4.png" xlink:title="PNG File , 122 KB"/>
      </supplementary-material>
      <supplementary-material id="app5">
        <label>Multimedia Appendix 5</label>
        <p>Word cloud 4.</p>
        <media xlink:href="jmir_v26i1e48324_app5.png" xlink:title="PNG File , 121 KB"/>
      </supplementary-material>
      <supplementary-material id="app6">
        <label>Multimedia Appendix 6</label>
        <p>Word cloud 5.</p>
        <media xlink:href="jmir_v26i1e48324_app6.png" xlink:title="PNG File , 111 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AR</term>
          <def>
            <p>allergic rhinitis</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">CBOW</term>
          <def>
            <p>Continuous Bag-of-Words Model</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">CNN</term>
          <def>
            <p>convolutional neural network</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">RNN</term>
          <def>
            <p>recurrent neural network</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>The data set collection and analysis of this research were partially supported by the National Natural Science Foundation of China (grants 72131006, 72071063, and 72271082); Anhui Provincial Key Research and Development Plan Project (grant 2022i01020003); and the Fundamental Research Funds for the Central Universities (grant JS2023ZSPY0063).</p>
    </ack>
    <notes>
      <sec>
        <title>Data Availability</title>
        <p>The data sets generated and analyzed during this study are available from the corresponding author upon reasonable request.</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="con">
        <p>DG conceptualized and investigated the study. QW drafted the methodology, performed the software analysis, and prepared the original draft. YC reviewed and edited the draft. XY completed the investigation. WZ drafted the methodology and supervised the study. ML supervised the study. ZX conceptualized the study. GZ and ZO supervised the study.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pawankar</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Baena-Cagnani</surname>
              <given-names>CE</given-names>
            </name>
            <name name-style="western">
              <surname>Bousquet</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Walter Canonica</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Cruz</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Kaliner</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Lanier</surname>
              <given-names>BQ</given-names>
            </name>
            <name name-style="western">
              <surname>Henley</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>State of world allergy report 2008: allergy and chronic respiratory diseases</article-title>
          <source>World Allergy Org J</source>
          <year>2008</year>
          <volume>1</volume>
          <fpage>S4</fpage>
          <lpage>17</lpage>
          <pub-id pub-id-type="doi">10.1186/1939-4551-1-S1-S4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Krishna</surname>
              <given-names>MT</given-names>
            </name>
            <name name-style="western">
              <surname>Mahesh</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Vedanthan</surname>
              <given-names>PK</given-names>
            </name>
            <name name-style="western">
              <surname>Mehta</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Moitra</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Christopher</surname>
              <given-names>DJ</given-names>
            </name>
          </person-group>
          <article-title>The burden of allergic diseases in the Indian subcontinent: barriers and challenges</article-title>
          <source>Lancet Glob Health</source>
          <year>2020</year>
          <month>04</month>
          <volume>8</volume>
          <issue>4</issue>
          <fpage>e478</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2214-109X(20)30061-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S2214-109X(20)30061-9</pub-id>
          <pub-id pub-id-type="medline">32199115</pub-id>
          <pub-id pub-id-type="pii">S2214-109X(20)30061-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Greiner</surname>
              <given-names>AN</given-names>
            </name>
            <name name-style="western">
              <surname>Hellings</surname>
              <given-names>PW</given-names>
            </name>
            <name name-style="western">
              <surname>Rotiroti</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Scadding</surname>
              <given-names>GK</given-names>
            </name>
          </person-group>
          <article-title>Allergic rhinitis</article-title>
          <source>Lancet</source>
          <year>2011</year>
          <month>12</month>
          <day>17</day>
          <volume>378</volume>
          <issue>9809</issue>
          <fpage>2112</fpage>
          <lpage>22</lpage>
          <pub-id pub-id-type="doi">10.1016/S0140-6736(11)60130-X</pub-id>
          <pub-id pub-id-type="medline">21783242</pub-id>
          <pub-id pub-id-type="pii">S0140-6736(11)60130-X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>XD</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lou</surname>
              <given-names>HF</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>CS</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Bo</surname>
              <given-names>MY</given-names>
            </name>
            <name name-style="western">
              <surname>Ge</surname>
              <given-names>SQ</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Bachert</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>An increased prevalence of self-reported allergic rhinitis in major Chinese cities from 2005 to 2011</article-title>
          <source>Allergy</source>
          <year>2016</year>
          <month>08</month>
          <day>13</day>
          <volume>71</volume>
          <issue>8</issue>
          <fpage>1170</fpage>
          <lpage>80</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/26948849"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/all.12874</pub-id>
          <pub-id pub-id-type="medline">26948849</pub-id>
          <pub-id pub-id-type="pmcid">PMC5074323</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Price</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Hellings</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Papadopoulos</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Fokkens</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Muraro</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Murray</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Chisholm</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Demoly</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Scadding</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Mullol</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lieberman</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Bachert</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Mösges</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Ryan</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Bousquet</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Current controversies and challenges in allergic rhinitis management</article-title>
          <source>Expert Rev Clin Immunol</source>
          <year>2015</year>
          <month>08</month>
          <day>29</day>
          <volume>11</volume>
          <issue>11</issue>
          <fpage>1205</fpage>
          <lpage>17</lpage>
          <pub-id pub-id-type="doi">10.1586/1744666x.2015.1081814</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cardell</surname>
              <given-names>LO</given-names>
            </name>
            <name name-style="western">
              <surname>Olsson</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Andersson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Welin</surname>
              <given-names>KO</given-names>
            </name>
            <name name-style="western">
              <surname>Svensson</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tennvall</surname>
              <given-names>GR</given-names>
            </name>
            <name name-style="western">
              <surname>Hellgren</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>TOTALL: high cost of allergic rhinitis—a national Swedish population-based questionnaire study</article-title>
          <source>NPJ Prim Care Respir Med</source>
          <year>2016</year>
          <month>02</month>
          <day>04</day>
          <volume>26</volume>
          <issue>1</issue>
          <fpage>15082</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/npjpcrm.2015.82"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/npjpcrm.2015.82</pub-id>
          <pub-id pub-id-type="medline">26845513</pub-id>
          <pub-id pub-id-type="pii">npjpcrm201582</pub-id>
          <pub-id pub-id-type="pmcid">PMC4741287</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Terreehorst</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Hak</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Oosting</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Tempels-Pavlica</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>de Monchy</surname>
              <given-names>JG</given-names>
            </name>
            <name name-style="western">
              <surname>Bruijnzeel-Koomen</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Aalberse</surname>
              <given-names>RC</given-names>
            </name>
            <name name-style="western">
              <surname>Gerth van Wijk</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Evaluation of impermeable covers for bedding in patients with allergic rhinitis</article-title>
          <source>N Engl J Med</source>
          <year>2003</year>
          <month>07</month>
          <day>17</day>
          <volume>349</volume>
          <issue>3</issue>
          <fpage>237</fpage>
          <lpage>46</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://core.ac.uk/reader/19184690?utm_source=linkout"/>
          </comment>
          <pub-id pub-id-type="doi">10.1056/NEJMoa023171</pub-id>
          <pub-id pub-id-type="medline">12867607</pub-id>
          <pub-id pub-id-type="pii">349/3/237</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Increasing prevalence of allergic rhinitis in China</article-title>
          <source>Allergy Asthma Immunol Res</source>
          <year>2019</year>
          <month>03</month>
          <volume>11</volume>
          <issue>2</issue>
          <fpage>156</fpage>
          <lpage>69</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/30661309"/>
          </comment>
          <pub-id pub-id-type="doi">10.4168/aair.2019.11.2.156</pub-id>
          <pub-id pub-id-type="medline">30661309</pub-id>
          <pub-id pub-id-type="pii">11.156</pub-id>
          <pub-id pub-id-type="pmcid">PMC6340797</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Niu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Shan</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Guan</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Gu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Han</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Ruan</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Cong</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Analysis of prevalence and risk factors of adult self-reported allergic rhinitis and asthma in plain lands and hilly areas of Shenmu City, China</article-title>
          <source>Front Public Health</source>
          <year>2021</year>
          <month>01</month>
          <day>04</day>
          <volume>9</volume>
          <fpage>749388</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35059372"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fpubh.2021.749388</pub-id>
          <pub-id pub-id-type="medline">35059372</pub-id>
          <pub-id pub-id-type="pmcid">PMC8765605</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Bensi</surname>
              <given-names>MT</given-names>
            </name>
            <name name-style="western">
              <surname>Hall</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Baecher</surname>
              <given-names>GB</given-names>
            </name>
          </person-group>
          <article-title>Dynamic assessment of the COVID-19 vaccine acceptance leveraging social media data</article-title>
          <source>J Biomed Inform</source>
          <year>2022</year>
          <month>05</month>
          <volume>129</volume>
          <fpage>104054</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(22)00070-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2022.104054</pub-id>
          <pub-id pub-id-type="medline">35331966</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(22)00070-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC8935963</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Castillo</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Benitez</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Llorens</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Social media-driven customer engagement and movie performance: theory and empirical evidence</article-title>
          <source>Decis Support Syst</source>
          <year>2021</year>
          <month>06</month>
          <volume>145</volume>
          <fpage>113516</fpage>
          <pub-id pub-id-type="doi">10.1016/j.dss.2021.113516</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stieglitz</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Dang-Xuan</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Emotions and information diffusion in social media—sentiment of microblogs and sharing behavior</article-title>
          <source>J Manag Inf Syst</source>
          <year>2014</year>
          <month>12</month>
          <day>08</day>
          <volume>29</volume>
          <issue>4</issue>
          <fpage>217</fpage>
          <lpage>48</lpage>
          <pub-id pub-id-type="doi">10.2753/MIS0742-1222290408</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kumar</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Srinivasan</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Wen-Huang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zomaya</surname>
              <given-names>AY</given-names>
            </name>
          </person-group>
          <article-title>Hybrid context enriched deep learning model for fine-grained sentiment analysis in textual and visual semiotic modality social data</article-title>
          <source>Inf Process Manag</source>
          <year>2020</year>
          <month>01</month>
          <volume>57</volume>
          <issue>1</issue>
          <fpage>102141</fpage>
          <pub-id pub-id-type="doi">10.1016/j.ipm.2019.102141</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>GA</given-names>
            </name>
            <name name-style="western">
              <surname>Fan</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Finding useful solutions in online knowledge communities: a theory-driven design and multilevel analysis</article-title>
          <source>Inf Syst Res</source>
          <year>2020</year>
          <month>09</month>
          <volume>31</volume>
          <issue>3</issue>
          <fpage>731</fpage>
          <lpage>52</lpage>
          <pub-id pub-id-type="doi">10.1287/isre.2019.0911</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lindelöf</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Aledavood</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Keller</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Dynamics of the negative discourse toward COVID-19 vaccines: topic modeling study and an annotated data set of Twitter posts</article-title>
          <source>J Med Internet Res</source>
          <year>2023</year>
          <month>04</month>
          <day>12</day>
          <volume>25</volume>
          <fpage>e41319</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2023/1/e41319/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/41319</pub-id>
          <pub-id pub-id-type="medline">36877804</pub-id>
          <pub-id pub-id-type="pii">v25i1e41319</pub-id>
          <pub-id pub-id-type="pmcid">PMC10134018</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Public attitudes toward anxiety disorder on Sina Weibo: content analysis</article-title>
          <source>J Med Internet Res</source>
          <year>2023</year>
          <month>04</month>
          <day>04</day>
          <volume>25</volume>
          <fpage>e45777</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2023/1/e45777/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/45777</pub-id>
          <pub-id pub-id-type="medline">37014691</pub-id>
          <pub-id pub-id-type="pii">v25i1e45777</pub-id>
          <pub-id pub-id-type="pmcid">PMC10131780</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shin</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>GM</given-names>
            </name>
            <name name-style="western">
              <surname>Whinston</surname>
              <given-names>AB</given-names>
            </name>
            <name name-style="western">
              <surname>Cetintas</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>KC</given-names>
            </name>
          </person-group>
          <article-title>Enhancing social media analysis with visual data analytics: a deep learning approach</article-title>
          <source>MIS Q</source>
          <year>2020</year>
          <month>12</month>
          <day>01</day>
          <volume>44</volume>
          <issue>4</issue>
          <fpage>1459</fpage>
          <lpage>92</lpage>
          <pub-id pub-id-type="doi">10.25300/MISQ/2020/14870</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Paul</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dredze</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>You are what you tweet: analyzing Twitter for public health</article-title>
          <source>Proc Int AAAI Conf Web Social Media</source>
          <year>2021</year>
          <month>08</month>
          <day>03</day>
          <volume>5</volume>
          <issue>1</issue>
          <fpage>265</fpage>
          <lpage>72</lpage>
          <pub-id pub-id-type="doi">10.1609/icwsm.v5i1.14137</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pradeepa</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Manjula</surname>
              <given-names>KR</given-names>
            </name>
            <name name-style="western">
              <surname>Vimal</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Khan</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Chilamkurti</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Luhach</surname>
              <given-names>AK</given-names>
            </name>
          </person-group>
          <article-title>DRFS: detecting risk factor of stroke disease from social media using machine learning techniques</article-title>
          <source>Neural Process Lett</source>
          <year>2020</year>
          <month>06</month>
          <day>09</day>
          <volume>55</volume>
          <issue>4</issue>
          <fpage>3843</fpage>
          <lpage>61</lpage>
          <pub-id pub-id-type="doi">10.1007/s11063-020-10279-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>DD</given-names>
            </name>
            <name name-style="western">
              <surname>Fang</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Understanding medication nonadherence from social media: a sentiment-enriched deep learning approach</article-title>
          <source>MIS Q</source>
          <year>2022</year>
          <month>02</month>
          <day>25</day>
          <volume>46</volume>
          <issue>1</issue>
          <fpage>341</fpage>
          <lpage>72</lpage>
          <pub-id pub-id-type="doi">10.25300/MISQ/2022/15336</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Navale</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>McAuliffe</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>The integration of a canonical workflow framework with an informatics system for disease area research</article-title>
          <source>Data Intell</source>
          <year>2022</year>
          <volume>4</volume>
          <issue>2</issue>
          <fpage>186</fpage>
          <lpage>95</lpage>
          <pub-id pub-id-type="doi">10.1162/dint_a_00125</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Lan</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Advances and highlights in allergic rhinitis</article-title>
          <source>Allergy</source>
          <year>2021</year>
          <month>11</month>
          <day>17</day>
          <volume>76</volume>
          <issue>11</issue>
          <fpage>3383</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1111/all.15044</pub-id>
          <pub-id pub-id-type="medline">34379805</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chiang</surname>
              <given-names>TY</given-names>
            </name>
            <name name-style="western">
              <surname>Yuan</surname>
              <given-names>TH</given-names>
            </name>
            <name name-style="western">
              <surname>Shie</surname>
              <given-names>RH</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>CF</given-names>
            </name>
            <name name-style="western">
              <surname>Chan</surname>
              <given-names>CC</given-names>
            </name>
          </person-group>
          <article-title>Increased incidence of allergic rhinitis, bronchitis and asthma, in children living near a petrochemical complex with SO<sub>2</sub> pollution</article-title>
          <source>Environ Int</source>
          <year>2016</year>
          <month>11</month>
          <volume>96</volume>
          <fpage>1</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.1016/j.envint.2016.08.009</pub-id>
          <pub-id pub-id-type="medline">27585759</pub-id>
          <pub-id pub-id-type="pii">S0160-4120(16)30299-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kurganskiy</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Creer</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>de Vere</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Griffith</surname>
              <given-names>GW</given-names>
            </name>
            <name name-style="western">
              <surname>Osborne</surname>
              <given-names>NJ</given-names>
            </name>
            <name name-style="western">
              <surname>Wheeler</surname>
              <given-names>BW</given-names>
            </name>
            <name name-style="western">
              <surname>McInnes</surname>
              <given-names>RN</given-names>
            </name>
            <name name-style="western">
              <surname>Clewlow</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Barber</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Brennan</surname>
              <given-names>GL</given-names>
            </name>
            <name name-style="western">
              <surname>Hanlon</surname>
              <given-names>HM</given-names>
            </name>
            <name name-style="western">
              <surname>Hegarty</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Potter</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Rowney</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Adams-Groom</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Petch</surname>
              <given-names>GM</given-names>
            </name>
            <name name-style="western">
              <surname>Pashley</surname>
              <given-names>CH</given-names>
            </name>
            <name name-style="western">
              <surname>Satchwell</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>de Weger</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Rasmussen</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Oliver</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Sindt</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bruffaerts</surname>
              <given-names>N</given-names>
            </name>
            <collab>PollerGEN Consortium</collab>
            <name name-style="western">
              <surname>Skjøth</surname>
              <given-names>CA</given-names>
            </name>
          </person-group>
          <article-title>Predicting the severity of the grass pollen season and the effect of climate change in Northwest Europe</article-title>
          <source>Sci Adv</source>
          <year>2021</year>
          <month>03</month>
          <day>26</day>
          <volume>7</volume>
          <issue>13</issue>
          <fpage>eabd7658</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.science.org/doi/abs/10.1126/sciadv.abd7658?url_ver=Z39.88-2003&#38;rfr_id=ori:rid:crossref.org&#38;rfr_dat=cr_pub%3dpubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1126/sciadv.abd7658</pub-id>
          <pub-id pub-id-type="medline">33771862</pub-id>
          <pub-id pub-id-type="pii">7/13/eabd7658</pub-id>
          <pub-id pub-id-type="pmcid">PMC7997511</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>JY</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Huh</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Moon</surname>
              <given-names>KW</given-names>
            </name>
          </person-group>
          <article-title>Association between environmental exposure to phthalates and allergic disorders in Korean children: Korean National Environmental Health Survey (KoNEHS) 2015-2017</article-title>
          <source>Int J Hyg Environ Health</source>
          <year>2021</year>
          <month>09</month>
          <volume>238</volume>
          <fpage>113857</fpage>
          <pub-id pub-id-type="doi">10.1016/j.ijheh.2021.113857</pub-id>
          <pub-id pub-id-type="medline">34644676</pub-id>
          <pub-id pub-id-type="pii">S1438-4639(21)00172-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Paciência</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Cavaleiro Rufo</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Silva</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Mendes</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Farraia</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Delgado</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Padrão</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Moreira</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Severo</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Moreira</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Effects of indoor endocrine-disrupting chemicals on childhood rhinitis</article-title>
          <source>J Investig Allergol Clin Immunol</source>
          <year>2020</year>
          <month>06</month>
          <day>18</day>
          <volume>30</volume>
          <issue>3</issue>
          <fpage>195</fpage>
          <lpage>97</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.jiaci.org/summary/vol30-issue3-num2022"/>
          </comment>
          <pub-id pub-id-type="doi">10.18176/jiaci.0471</pub-id>
          <pub-id pub-id-type="medline">31833476</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Saulyte</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Regueira</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Montes-Martínez</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Khudyakov</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Takkouche</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Active or passive exposure to tobacco smoking and allergic rhinitis, allergic dermatitis, and food allergy in adults and children: a systematic review and meta-analysis</article-title>
          <source>PLoS Med</source>
          <year>2014</year>
          <month>03</month>
          <day>11</day>
          <volume>11</volume>
          <issue>3</issue>
          <fpage>e1001611</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pmed.1001611"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pmed.1001611</pub-id>
          <pub-id pub-id-type="medline">24618794</pub-id>
          <pub-id pub-id-type="pii">PMEDICINE-D-13-00926</pub-id>
          <pub-id pub-id-type="pmcid">PMC3949681</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kong</surname>
              <given-names>IG</given-names>
            </name>
            <name name-style="western">
              <surname>Rhee</surname>
              <given-names>CS</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Yim</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Choi</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Han</surname>
              <given-names>DH</given-names>
            </name>
          </person-group>
          <article-title>Association between perceived stress and rhinitis-related quality of life: a multicenter, cross-sectional study</article-title>
          <source>J Clin Med</source>
          <year>2021</year>
          <month>08</month>
          <day>19</day>
          <volume>10</volume>
          <issue>16</issue>
          <fpage>3680</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=jcm10163680"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/jcm10163680</pub-id>
          <pub-id pub-id-type="medline">34441978</pub-id>
          <pub-id pub-id-type="pii">jcm10163680</pub-id>
          <pub-id pub-id-type="pmcid">PMC8397163</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Han</surname>
              <given-names>YY</given-names>
            </name>
            <name name-style="western">
              <surname>Forno</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Gogna</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Celedón</surname>
              <given-names>JC</given-names>
            </name>
          </person-group>
          <article-title>Obesity and rhinitis in a nationwide study of children and adults in the United States</article-title>
          <source>J Allergy Clin Immunol</source>
          <year>2016</year>
          <month>05</month>
          <volume>137</volume>
          <issue>5</issue>
          <fpage>1460</fpage>
          <lpage>5</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/26883461"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jaci.2015.12.1307</pub-id>
          <pub-id pub-id-type="medline">26883461</pub-id>
          <pub-id pub-id-type="pii">S0091-6749(16)00084-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC4860058</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kanazawa</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Masuko</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Yatagai</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Sakamoto</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Yamada</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kitazawa</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Iijima</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Naito</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Saito</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Noguchi</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Hirota</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Tamari</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hizawa</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Association analyses of eQTLs of the TYRO3 gene and allergic diseases in Japanese populations</article-title>
          <source>Allergol Int</source>
          <year>2019</year>
          <month>01</month>
          <volume>68</volume>
          <issue>1</issue>
          <fpage>77</fpage>
          <lpage>81</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1323-8930(18)30087-X"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.alit.2018.07.004</pub-id>
          <pub-id pub-id-type="medline">30082152</pub-id>
          <pub-id pub-id-type="pii">S1323-8930(18)30087-X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Alm</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Goksör</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Pettersson</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Möllborg</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Erdes</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Loid</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Aberg</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Wennergren</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Antibiotics in the first week of life is a risk factor for allergic rhinitis at school age</article-title>
          <source>Pediatr Allergy Immunol</source>
          <year>2014</year>
          <month>08</month>
          <day>09</day>
          <volume>25</volume>
          <issue>5</issue>
          <fpage>468</fpage>
          <lpage>72</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/24912441"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/pai.12244</pub-id>
          <pub-id pub-id-type="medline">24912441</pub-id>
          <pub-id pub-id-type="pmcid">PMC4282316</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ho</surname>
              <given-names>CL</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>WF</given-names>
            </name>
          </person-group>
          <article-title>Risk factor analysis of allergic rhinitis in 6-8 year-old children in Taipei</article-title>
          <source>PLoS One</source>
          <year>2021</year>
          <month>04</month>
          <day>02</day>
          <volume>16</volume>
          <issue>4</issue>
          <fpage>e0249572</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0249572"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0249572</pub-id>
          <pub-id pub-id-type="medline">33798255</pub-id>
          <pub-id pub-id-type="pii">PONE-D-20-25855</pub-id>
          <pub-id pub-id-type="pmcid">PMC8018651</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Ram</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>A comprehensive analysis of triggers and risk factors for asthma based on machine learning and large heterogeneous data sources</article-title>
          <source>MIS Q</source>
          <year>2020</year>
          <month>01</month>
          <day>01</day>
          <volume>44</volume>
          <issue>1</issue>
          <fpage>305</fpage>
          <lpage>49</lpage>
          <pub-id pub-id-type="doi">10.25300/misq/2020/15106</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Griffis</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Asch</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Schwartz</surname>
              <given-names>HA</given-names>
            </name>
            <name name-style="western">
              <surname>Ungar</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Buttenheim</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Barg</surname>
              <given-names>FK</given-names>
            </name>
            <name name-style="western">
              <surname>Mitra</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Merchant</surname>
              <given-names>RM</given-names>
            </name>
          </person-group>
          <article-title>Using social media to track geographic variability in language about diabetes: analysis of diabetes-related tweets across the United States</article-title>
          <source>JMIR Diabetes</source>
          <year>2020</year>
          <month>01</month>
          <day>26</day>
          <volume>5</volume>
          <issue>1</issue>
          <fpage>e14431</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://diabetes.jmir.org/2020/1/e14431/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/14431</pub-id>
          <pub-id pub-id-type="medline">32044757</pub-id>
          <pub-id pub-id-type="pii">v5i1e14431</pub-id>
          <pub-id pub-id-type="pmcid">PMC7055793</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schäfer</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Faviez</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Voillot</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Foulquié</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Najm</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Jeanne</surname>
              <given-names>JF</given-names>
            </name>
            <name name-style="western">
              <surname>Fagherazzi</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Schück</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Le Nevé</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Mapping and modeling of discussions related to gastrointestinal discomfort in French-speaking online forums: results of a 15-year retrospective infodemiology study</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <month>11</month>
          <day>03</day>
          <volume>22</volume>
          <issue>11</issue>
          <fpage>e17247</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/11/e17247/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/17247</pub-id>
          <pub-id pub-id-type="medline">33141087</pub-id>
          <pub-id pub-id-type="pii">v22i11e17247</pub-id>
          <pub-id pub-id-type="pmcid">PMC7671840</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Oyebode</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Orji</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Detecting factors responsible for diabetes prevalence in Nigeria using social media and machine learning</article-title>
          <source>Proceedings of the 15th International Conference on Network and Service Management (CNSM)</source>
          <year>2019</year>
          <conf-name>15th International Conference on Network and Service Management (CNSM)</conf-name>
          <conf-date>October 21-25, 2019</conf-date>
          <conf-loc>Halifax, NS</conf-loc>
          <pub-id pub-id-type="doi">10.23919/cnsm46954.2019.9012679</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ramsingh</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bhuvaneswari</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>A big data framework to analyze risk factors of diabetes outbreak in Indian population using a map reduce algorithm</article-title>
          <source>Proceedings of the Second International Conference on Intelligent Computing and Control Systems (ICICCS)</source>
          <year>2018</year>
          <conf-name>Second International Conference on Intelligent Computing and Control Systems (ICICCS)</conf-name>
          <conf-date>June 14-15, 2018</conf-date>
          <conf-loc>Madurai, India</conf-loc>
          <pub-id pub-id-type="doi">10.1109/iccons.2018.8663143</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ramsingh</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bhuvaneswari</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>An integrated multi-node Hadoop framework to predict high-risk factors of diabetes mellitus using a multilevel MapReduce based fuzzy classifier (MMR-FC) and modified DBSCAN algorithm</article-title>
          <source>Appl Soft Comput</source>
          <year>2021</year>
          <month>09</month>
          <volume>108</volume>
          <fpage>107423</fpage>
          <pub-id pub-id-type="doi">10.1016/j.asoc.2021.107423</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Alswedani</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Mehmood</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Katib</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Altowaijri</surname>
              <given-names>SM</given-names>
            </name>
          </person-group>
          <article-title>Psychological health and drugs: data-driven discovery of causes, treatments, effects, and abuses</article-title>
          <source>Toxics</source>
          <year>2023</year>
          <month>03</month>
          <day>20</day>
          <volume>11</volume>
          <issue>3</issue>
          <fpage>287</fpage>
          <pub-id pub-id-type="doi">10.3390/toxics11030287</pub-id>
          <pub-id pub-id-type="medline">36977052</pub-id>
          <pub-id pub-id-type="pii">toxics11030287</pub-id>
          <pub-id pub-id-type="pmcid">PMC10053492</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chung</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Mustapha</surname>
              <given-names>IZ</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Gu</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Discourse about human papillomavirus (HPV)-associated oropharyngeal cancer (OPC) on Twitter: lessons for public health education about OPC and dental care</article-title>
          <source>Public Health Pract (Oxf)</source>
          <year>2022</year>
          <month>06</month>
          <volume>3</volume>
          <fpage>100239</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2666-5352(22)00015-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.puhip.2022.100239</pub-id>
          <pub-id pub-id-type="medline">36101754</pub-id>
          <pub-id pub-id-type="pii">S2666-5352(22)00015-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC9461587</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Neisani Samani</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Karimi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Alesheikh</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Environmental and infrastructural effects on respiratory disease exacerbation: a LBSN and ANN-based spatio-temporal modelling</article-title>
          <source>Environ Monit Assess</source>
          <year>2020</year>
          <month>01</month>
          <day>04</day>
          <volume>192</volume>
          <issue>2</issue>
          <fpage>90</fpage>
          <pub-id pub-id-type="doi">10.1007/s10661-019-7987-x</pub-id>
          <pub-id pub-id-type="medline">31902018</pub-id>
          <pub-id pub-id-type="pii">10.1007/s10661-019-7987-x</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mikolov</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Sutskever</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Corrado</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Dean</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Distributed representations of words and phrases and their compositionality</article-title>
          <source>arXiv. Preprint posted online October 16, 2013</source>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1310.4546"/>
          </comment>
          <pub-id pub-id-type="doi">10.5555/2999792.2999959</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Qin</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Learning sentiment-specific word embedding for Twitter sentiment classification</article-title>
          <source>Proceedings of the 52nd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)</source>
          <year>2014</year>
          <conf-name>52nd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)</conf-name>
          <conf-date>June 22-27, 2014</conf-date>
          <conf-loc>Baltimore, MD</conf-loc>
          <pub-id pub-id-type="doi">10.3115/v1/p14-1146</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yilmaz</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Toklu</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>A deep learning analysis on question classification task using Word2vec representations</article-title>
          <source>Neural Comput Appl</source>
          <year>2020</year>
          <month>01</month>
          <day>21</day>
          <volume>32</volume>
          <issue>7</issue>
          <fpage>2909</fpage>
          <lpage>28</lpage>
          <pub-id pub-id-type="doi">10.1007/s00521-020-04725-w</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shi</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Fu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Bing</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Lam</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Learning domain-sensitive and sentiment-aware word embeddings</article-title>
          <source>Proceedings of the 56th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)</source>
          <year>2018</year>
          <conf-name>56th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)</conf-name>
          <conf-date>July 15-20, 2018</conf-date>
          <conf-loc>Melbourne, Australia</conf-loc>
          <pub-id pub-id-type="doi">10.18653/v1/p18-1232</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Convolutional neural networks for sentence classification</article-title>
          <source>Proceedings of the 2014 Conference on Empirical Methods in Natural Language Processing (EMNLP)</source>
          <year>2014</year>
          <conf-name>2014 Conference on Empirical Methods in Natural Language Processing (EMNLP)</conf-name>
          <conf-date>October 25-29, 2014</conf-date>
          <conf-loc>Doha, Qatar</conf-loc>
          <pub-id pub-id-type="doi">10.3115/v1/d14-1181</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zaremba</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Sutskever</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Vinyals</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <article-title>Recurrent neural network regularization</article-title>
          <source>arXiv. Preprint posted online September 8, 2014</source>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1409.2329"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/ARXIV.1409.2329</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vaswani</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Shazeer</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Parmar</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Uszkoreit</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Gomez</surname>
              <given-names>AN</given-names>
            </name>
            <name name-style="western">
              <surname>Kaiser</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Polosukhin</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Attention is all you need</article-title>
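          <source>arXiv. Preprint posted online June 12, 2017</source>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1706.03762"/>
          </comment>
          <pub-id pub-id-type="doi">10.48550/ARXIV.1706.03762</pub-id>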
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Moe</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Measuring brand favorability using large-scale social media data</article-title>
          <source>Inf Syst Res</source>
          <year>2021</year>
          <month>12</month>
          <volume>32</volume>
          <issue>4</issue>
          <fpage>1128</fpage>
          <lpage>39</lpage>
          <pub-id pub-id-type="doi">10.1287/isre.2021.1030</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Abbasi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Adjeroh</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Abate</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Don’t mention it? Analyzing user-generated content signals for early adverse event warnings</article-title>
          <source>Inf Syst Res</source>
          <year>2019</year>
          <month>09</month>
          <volume>30</volume>
          <issue>3</issue>
          <fpage>1007</fpage>
          <lpage>28</lpage>
          <pub-id pub-id-type="doi">10.1287/isre.2019.0847</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Wan</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>AOL4PS: a large-scale data set for personalized search</article-title>
          <source>Data Intell</source>
          <year>2021</year>
          <volume>3</volume>
          <issue>4</issue>
          <fpage>548</fpage>
          <lpage>67</lpage>
          <pub-id pub-id-type="doi">10.1162/dint_a_00104</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Khatua</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Khatua</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cambria</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>A tale of two epidemics: contextual Word2Vec for classifying Twitter streams during outbreaks</article-title>
          <source>Inf Process Manag</source>
          <year>2019</year>
          <month>01</month>
          <volume>56</volume>
          <issue>1</issue>
          <fpage>247</fpage>
          <lpage>57</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ipm.2018.10.010</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gu</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Gu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>An analysis of cognitive change in online mental health communities: a textual data analysis based on post replies of support seekers</article-title>
          <source>Inf Process Manag</source>
          <year>2023</year>
          <month>03</month>
          <volume>60</volume>
          <issue>2</issue>
          <fpage>103192</fpage>
          <pub-id pub-id-type="doi">10.1016/j.ipm.2022.103192</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Eysenbach</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Till</surname>
              <given-names>JE</given-names>
            </name>
          </person-group>
          <article-title>Ethical issues in qualitative research on internet communities</article-title>
          <source>BMJ</source>
          <year>2001</year>
          <month>11</month>
          <day>10</day>
          <volume>323</volume>
          <issue>7321</issue>
          <fpage>1103</fpage>
          <lpage>5</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/11701577"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmj.323.7321.1103</pub-id>
          <pub-id pub-id-type="medline">11701577</pub-id>
          <pub-id pub-id-type="pmcid">PMC59687</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>JT</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Thread detection in dynamic text message streams</article-title>
          <source>Proceedings of the 29th annual international ACM SIGIR conference on Research and development in information retrieval</source>
          <year>2006</year>
          <conf-name>SIGIR '06</conf-name>
          <conf-date>August 6-11, 2006</conf-date>
          <conf-loc>Seattle, WA</conf-loc>
          <pub-id pub-id-type="doi">10.1145/1148170.1148180</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mihalcea</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Tarau</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>TextRank: bringing order into text</article-title>
          <source>Proceedings of the 2004 Conference on Empirical Methods in Natural Language Processing</source>
          <year>2004</year>
          <conf-name>2004 Conference on Empirical Methods in Natural Language Processing</conf-name>
          <conf-date>July 25-26, 2004</conf-date>
          <conf-loc>Barcelona, Spain</conf-loc>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://aclanthology.org/W04-3252.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Long</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Yan</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Rank-IDF: a statistical and network based feature words selection in big data text analysis</article-title>
          <source>Proceedings of the 2020 5th International Conference on Mathematics and Artificial Intelligence</source>
          <year>2020</year>
          <conf-name>ICMAI '20</conf-name>
          <conf-date>April 10-13, 2020</conf-date>
          <conf-loc>Chengdu, China</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3395260.3395291</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wright</surname>
              <given-names>AP</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Chau</surname>
              <given-names>DH</given-names>
            </name>
            <name name-style="western">
              <surname>Gladden</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Sumner</surname>
              <given-names>SA</given-names>
            </name>
          </person-group>
          <article-title>Detection of emerging drugs involved in overdose via diachronic word embeddings of substances discussed on social media</article-title>
          <source>J Biomed Inform</source>
          <year>2021</year>
          <month>07</month>
          <volume>119</volume>
          <fpage>103824</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(21)00153-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2021.103824</pub-id>
          <pub-id pub-id-type="medline">34048933</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(21)00153-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Unintended emotional effects of online health communities: a text mining-supported empirical study</article-title>
          <source>MIS Q</source>
          <year>2023</year>
          <month>03</month>
          <day>01</day>
          <volume>47</volume>
          <issue>1</issue>
          <fpage>195</fpage>
          <lpage>226</lpage>
          <pub-id pub-id-type="doi">10.25300/misq/2022/17018</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gangl</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Reininger</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Bernhard</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Campana</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Pree</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Reisinger</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kneidinger</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kundi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dolznig</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Thurnher</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Valent</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>KW</given-names>
            </name>
            <name name-style="western">
              <surname>Vrtala</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Spitzauer</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Valenta</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Niederberger</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Cigarette smoke facilitates allergen penetration across respiratory epithelium</article-title>
          <source>Allergy</source>
          <year>2009</year>
          <month>03</month>
          <day>23</day>
          <volume>64</volume>
          <issue>3</issue>
          <fpage>398</fpage>
          <lpage>405</lpage>
          <pub-id pub-id-type="doi">10.1111/j.1398-9995.2008.01861.x</pub-id>
          <pub-id pub-id-type="medline">19120070</pub-id>
          <pub-id pub-id-type="pii">ALL1861</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref61">
        <label>61</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Bai</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Ji</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Lian</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Detection of Dermatophagoides farinae in the dust of air conditioning filters</article-title>
          <source>Int Arch Allergy Immunol</source>
          <year>2007</year>
          <month>08</month>
          <day>10</day>
          <volume>144</volume>
          <issue>1</issue>
          <fpage>85</fpage>
          <lpage>90</lpage>
          <pub-id pub-id-type="doi">10.1159/000102619</pub-id>
          <pub-id pub-id-type="medline">17505140</pub-id>
          <pub-id pub-id-type="pii">000102619</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref62">
        <label>62</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schenkel</surname>
              <given-names>EJ</given-names>
            </name>
          </person-group>
          <article-title>Effect of desloratadine on the control of morning symptoms in patients with seasonal and perennial allergic rhinitis</article-title>
          <source>Allergy Asthma Proc</source>
          <year>2006</year>
          <month>11</month>
          <day>01</day>
          <volume>27</volume>
          <issue>6</issue>
          <fpage>465</fpage>
          <lpage>72</lpage>
          <pub-id pub-id-type="doi">10.2500/aap.2006.27.2936</pub-id>
          <pub-id pub-id-type="medline">17176780</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
