<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v22i11e17247</article-id>
      <article-id pub-id-type="pmid">33141087</article-id>
      <article-id pub-id-type="doi">10.2196/17247</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Mapping and Modeling of Discussions Related to Gastrointestinal Discomfort in French-Speaking Online Forums: Results of a 15-Year Retrospective Infodemiology Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Pougheon Bertrand</surname>
            <given-names>Dominique</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Lamy</surname>
            <given-names>Francois</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Schäfer</surname>
            <given-names>Florent</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Innovation Science and Nutrition</institution>
            <institution>Danone Nutricia Research</institution>
            <addr-line>RD 128 Avenue de la Vauve</addr-line>
            <addr-line>Palaiseau, 91767</addr-line>
            <country>France</country>
            <phone>33 1 69 35 70 00</phone>
            <email>florent.schafer@danone.com</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6816-5731</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Faviez</surname>
            <given-names>Carole</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-1500-0236</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Voillot</surname>
            <given-names>Paméla</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7156-9075</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Foulquié</surname>
            <given-names>Pierre</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4485-0835</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Najm</surname>
            <given-names>Matthieu</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9757-1499</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Jeanne</surname>
            <given-names>Jean-François</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5074-4679</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Fagherazzi</surname>
            <given-names>Guy</given-names>
          </name>
          <degrees>MSc, PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5033-5966</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Schück</surname>
            <given-names>Stéphane</given-names>
          </name>
          <degrees>MSc, MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2642-7726</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author">
          <name name-style="western">
            <surname>Le Nevé</surname>
            <given-names>Boris</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-3892-9045</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Innovation Science and Nutrition</institution>
        <institution>Danone Nutricia Research</institution>
        <addr-line>Palaiseau</addr-line>
        <country>France</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Kap Code</institution>
        <addr-line>Paris</addr-line>
        <country>France</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Deep Digital Phenotyping Research Unit</institution>
        <institution>Department of Population Health</institution>
        <institution>Luxembourg Institute of Health</institution>
        <addr-line>Strassen</addr-line>
        <country>Luxembourg</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Center of Research in Epidemiology and Population Health</institution>
        <institution>UMR 1018 Inserm, Institut Gustave Roussy</institution>
        <institution>Paris-Sud Paris-Saclay University</institution>
        <addr-line>Villejuif</addr-line>
        <country>France</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Florent Schäfer <email>florent.schafer@danone.com</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>11</month>
        <year>2020</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>3</day>
        <month>11</month>
        <year>2020</year>
      </pub-date>
      <volume>22</volume>
      <issue>11</issue>
      <elocation-id>e17247</elocation-id>
      <history>
        <date date-type="received">
          <day>28</day>
          <month>11</month>
          <year>2019</year>
        </date>
        <date date-type="rev-request">
          <day>10</day>
          <month>3</month>
          <year>2020</year>
        </date>
        <date date-type="rev-recd">
          <day>30</day>
          <month>4</month>
          <year>2020</year>
        </date>
        <date date-type="accepted">
          <day>25</day>
          <month>6</month>
          <year>2020</year>
        </date>
      </history>
      <copyright-statement>©Florent Schäfer, Carole Faviez, Paméla Voillot, Pierre Foulquié, Matthieu Najm, Jean-François Jeanne, Guy Fagherazzi, Stéphane Schück, Boris Le Nevé. Originally published in the Journal of Medical Internet Research (http://www.jmir.org), 03.11.2020.</copyright-statement>
      <copyright-year>2020</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on http://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2020/11/e17247" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Gastrointestinal (GI) discomfort is prevalent and known to be associated with impaired quality of life. Real-world information on factors of GI discomfort and solutions used by people is, however, limited. Social media, including online forums, have been considered a new source of information to examine the health of populations in real-life settings.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>The aims of this retrospective infodemiology study are to identify discussion topics, characterize users, and identify perceived determinants of GI discomfort in web-based messages posted by users of French social media.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>Messages related to GI discomfort posted between January 2003 and August 2018 were extracted from 14 French-speaking general and specialized publicly available online forums. Extracted messages were cleaned and deidentified. Relevant medical concepts were determined on the basis of the Medical Dictionary for Regulatory Activities and vernacular terms. The identification of discussion topics was carried out by using a correlated topic model on the basis of the latent Dirichlet allocation. A nonsupervised clustering algorithm was applied to cluster forum users according to the reported symptoms of GI discomfort, discussion topics, and activity on online forums. Users’ age and gender were determined by linear regression and application of a support vector machine, respectively, to characterize the identified clusters according to demographic parameters. Perceived factors of GI discomfort were classified by a combined method on the basis of syntactic analysis to identify messages with causality terms and a second topic modeling in a relevant segment of phrases.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>A total of 198,866 messages associated with GI discomfort were included in the analysis corpus after extraction and cleaning. These messages were posted by 36,989 separate web users, most of them being women younger than 40 years. Everyday life, diet, digestion, abdominal pain, impact on the quality of life, and tips to manage stress were among the most discussed topics. Segmentation of users identified 5 clusters corresponding to chronic and acute GI concerns. Diet topic was associated with each cluster, and stress was strongly associated with abdominal pain. Psychological factors, food, and allergens were perceived as the main causes of GI discomfort by web users.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>GI discomfort is actively discussed by web users. This study reveals a complex relationship between food, stress, and GI discomfort. Our approach has shown that identifying web-based discussion topics associated with GI discomfort and its perceived factors is feasible and can serve as a complementary source of real-world evidence for caregivers.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>gastrointestinal discomfort</kwd>
        <kwd>disorders of gut-brain interactions</kwd>
        <kwd>social media</kwd>
        <kwd>infodemiology</kwd>
        <kwd>topic modeling</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <sec>
          <title>Gastrointestinal Discomfort: Prevalence, Impact on Quality of Life, and Management</title>
          <p>Gastrointestinal (GI) discomfort (eg, bloating, abdominal pain, constipation) is very common in the general population, with a known impact on well-being [<xref ref-type="bibr" rid="ref1">1</xref>]. Chronic and severe symptoms of GI discomfort are associated with a significant decrease in quality of life [<xref ref-type="bibr" rid="ref2">2</xref>]. Irritable bowel syndrome (IBS) is the most studied condition among disorders of gut-brain interactions (DGBIs) [<xref ref-type="bibr" rid="ref3">3</xref>], with a highly heterogeneous prevalence ranging from 1.1% in France and Iran to 35.5% in Mexico [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref5">5</xref>]. Associated socioeconomic costs are significant because of the extensive use of health care resources and work absenteeism [<xref ref-type="bibr" rid="ref6">6</xref>-<xref ref-type="bibr" rid="ref8">8</xref>]. However, the etiology of DGBIs remains poorly understood. Among the pathophysiological mechanisms associated with IBS, GI sensory-motor alterations [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>], signs of discrete immune dysfunction [<xref ref-type="bibr" rid="ref11">11</xref>], and increased intestinal permeability [<xref ref-type="bibr" rid="ref12">12</xref>] are considered important. The possible involvement of gut microbiota in the pathogenesis of GI diseases and the occurrence of GI symptoms has also been explored, as the severity of IBS symptoms is associated with specific intestinal microbiota profiles [<xref ref-type="bibr" rid="ref13">13</xref>].</p>
          <p>Psychological comorbidities are commonly associated with GI symptoms, and the prevalence of anxiety and depression among people with IBS is estimated to be at least two to three times the rate in the general population [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref15">15</xref>]. Concerning women with abdominal pain, cramping, and discomfort, a recent web-based cross-sectional survey study [<xref ref-type="bibr" rid="ref16">16</xref>] showed that 96% of women reported that daily activities were disrupted at least sometimes by abdominal pain, cramping, and discomfort and 44% of women reported that daily activities were disrupted at least often. Other aspects of quality of life, such as quality of work, eating habits, and social activities, were also affected in most women [<xref ref-type="bibr" rid="ref16">16</xref>].</p>
          <p>DGBIs are the source of substantial health care consumption (consultations, complementary examinations, and hospitalizations), although this is difficult to quantify [<xref ref-type="bibr" rid="ref17">17</xref>], given their chronic nature and the absence of specific diagnostic tests in the case of IBS [<xref ref-type="bibr" rid="ref18">18</xref>]. In France, a cross-sectional study estimated the average annual direct cost to be €756 (US $888) for one patient and more than 3 days of sick leave per year [<xref ref-type="bibr" rid="ref17">17</xref>]. Another study conducted in the United Kingdom [<xref ref-type="bibr" rid="ref19">19</xref>] estimated the total cost of DGBIs in infants to be at least £72.3 (US $93.7) million per year in 2014 to 2015, of which £49.1 (US $63.6) million was the National Health Service expenditure on prescriptions, community care, and hospital treatment.</p>
          <p>The role of diet in the pathogenesis of IBS has already been highlighted [<xref ref-type="bibr" rid="ref20">20</xref>], and food is perceived as a factor of GI discomfort even in the absence of diagnosed allergy or malabsorption [<xref ref-type="bibr" rid="ref21">21</xref>]. The management of DGBIs especially relies on lifestyle, including physical activity and dietary measures. Available guidelines [<xref ref-type="bibr" rid="ref22">22</xref>] recommend regular meal patterns, avoidance of large meals, and reduced intake of fat, alcohol, spicy foods, insoluble fibers, caffeine, and gas-producing foods such as beans, cabbage, and onions. Eating meals in a quiet place (for at least about 20 min, without working) with sufficient chewing and hydration (1.5 to 2 liters per day) is also recommended [<xref ref-type="bibr" rid="ref22">22</xref>]. Dietary interventions (probiotics, prebiotics, and synbiotics) and restriction diets (eg, low-fermentable oligosaccharides, disaccharides, monosaccharides, and polyols, also known as low-FODMAP diet) have also been explored as potential therapeutic solutions in IBS [<xref ref-type="bibr" rid="ref23">23</xref>]. Available pharmacological treatments targeting either the GI tract or the brain have also shown some therapeutic value and include antidepressants, prokinetic agents, and painkillers [<xref ref-type="bibr" rid="ref24">24</xref>].</p>
        </sec>
        <sec>
          <title>Social Media as a Real-World Health Data Source</title>
          <p>The penetration of social media into modern society has become a global cultural phenomenon. Patients use peer-to-peer virtual communities and social media to share their experiences regarding their treatments and diseases. The use of social media allows large groups of people to create and share information, opinions, and experiences about health conditions and medications through web-based discussion [<xref ref-type="bibr" rid="ref25">25</xref>]. Social media can therefore be considered as a new data source to assess population health and quality of life, understand adherence to treatments, or identify adverse drug reactions. Patients highlighted the benefit of web-based interactions with other patients. For example, sharing information through social networks enabled patients to better communicate with health care providers. Patients often use social media to discuss drug side effects, quality of life and adherence to therapies. To analyze such data, which can be voluminous, appropriate tools are needed. Text mining techniques allow the classification and summarization of text data such as messages [<xref ref-type="bibr" rid="ref26">26</xref>]. This set of techniques has been used to extract information from electronic health records [<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref28">28</xref>]. They have also been used for various use cases with social media data. Some authors [<xref ref-type="bibr" rid="ref29">29</xref>] studied the messages from patients with breast cancer treated with aromatase inhibitors. 
In France, some studies have been published on the misuse and pharmacovigilance signals of methylphenidate [<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref31">31</xref>], the incorrect use of neuroleptics regarding anxiety [<xref ref-type="bibr" rid="ref32">32</xref>], and the safety profile of Levothyrox and the dynamics of its reporting on social media during the summer of 2017 [<xref ref-type="bibr" rid="ref33">33</xref>]. In multiple therapeutic areas, including diabetes and obesity, social media has been considered a real-world health evidence data source [<xref ref-type="bibr" rid="ref34">34</xref>]. Although web-based discussions are unstructured as compared with conventional clinical data, their volume (hundreds of thousands of users) is very large when compared with clinical data sets, and this information can therefore be considered as a complementary source of health data in observational research.</p>
        </sec>
      </sec>
      <sec>
        <title>Objectives</title>
        <p>This study was designed to explore perceived GI discomfort and better understand its determinants, on the basis of a retrospective assessment of web-based social media posts, which we considered as a real-life source of health information. In this study, we aimed to answer 3 main research questions: (1) Can we identify topics discussed by web users reporting symptoms of GI discomfort? (2) Can we categorize these users on the basis of the reported symptoms of GI discomfort and level of activity on social media while considering their age and gender? (3) Can we identify the perceived factors causing GI discomfort as reported by web users?</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Data Sources and Data Extraction</title>
        <p>Messages were retrieved (<xref rid="figure1" ref-type="fig">Figure 1</xref>) from general and specialized French medical web forums. Only messages from publicly available sources were extracted [<xref ref-type="bibr" rid="ref35">35</xref>]. Messages published between January 2003 and August 2018 containing keywords related to GI discomfort were retrieved along with messages from 3 GI discomfort–related subforums of <italic>Doctissimo</italic> [<xref ref-type="bibr" rid="ref36">36</xref>]: (1) <italic>constipation, other transit disorders</italic>; (2) <italic>digestion, heartburn, gastroesophageal reflux disease (GERD);</italic> and (3) <italic>abdominal pain, stomachache and ulcers</italic>. Messages were automatically extracted using the published <italic>Detec’t webcrawler</italic> [<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref38">38</xref>] developed by Kap Code. A web crawler is an engine that browses through hyperlinks and stores them for future download of associated web pages (identified by the visited hyperlinks) [<xref ref-type="bibr" rid="ref39">39</xref>]. Scraping of messages was performed according to the HTML structure of each forum. All discussions containing at least one of the keywords or one of their synonyms were automatically retrieved with all the associated metadata, deidentified and cleaned (signature and quote withdrawal) before being stored in a study-specific database. A description of the extracted corpus is presented in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. A complete list of the forums that were crawled is presented in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>, and a list of the keywords used for message retrieval is detailed in <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Study framework.</p>
          </caption>
          <graphic xlink:href="jmir_v22i11e17247_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>The corpus is presented in number of messages, one message being one statistical unit. As the total number of extracted messages could not be estimated in advance, no a priori assumption was made about the topics being discussed by web users, the clusters to be segmented, or the perceived factors to be identified, and no sample size was calculated for this observational study.</p>
      </sec>
      <sec>
        <title>Data Exclusion</title>
        <p>The analysis corpus consisted of the corpus cleaned after the removal of messages containing predetermined keywords written in a language other than French, messages containing at least one of the study-specific exclusion words (such as animal-related vocabulary or GI symptoms being used out of context), messages coming from specific URLs, and duplicates, as presented in <xref rid="figure2" ref-type="fig">Figure 2</xref>.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Flowchart presenting message extraction.</p>
          </caption>
          <graphic xlink:href="jmir_v22i11e17247_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Statistical Analyses</title>
        <sec>
          <title>Discussion Themes and Topics</title>
          <p>A topic model was applied to identify the themes addressed in the messages. Topic models consist of text mining approaches that aim to automatically identify the abstract themes addressed in a collection of documents. The simplest and most common form of topic models is latent Dirichlet allocation (LDA) [<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref41">41</xref>]. It is based on the hypothesis that each document in the corpus corresponds to a distribution of several topics, these distributions having a Dirichlet prior. The modeled topics are probability distributions over the tokens (words or a sequence of several adjacent words) found in the corpus. There is no prior assumption made about the nature of topics present in the corpus under study. These models have already been used to analyze health-related topics within tweets [<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref41">41</xref>] or online forums [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref43">43</xref>].</p>
          <p>For this study, the correlated topic model was used [<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]. In addition to being based on LDA [<xref ref-type="bibr" rid="ref44">44</xref>], it considers the existing relations between discussed topics as an additional parameter. The estimated correlation between 2 topics indicates the extent to which these 2 topics emerged simultaneously in posts.</p>
          <p>The modeling of the studied corpus went through different steps so that the topic model could be applied [<xref ref-type="bibr" rid="ref30">30</xref>]. The model was estimated using a variational expectation maximization algorithm [<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref45">45</xref>], which approximates the posterior distribution of topics on the corpus by finding the best combination of variational parameters. Topics being probability distributions over tokens of the study corpus, they can be characterized by the highest per-topic probability tokens. Weighting these probabilities through term frequency-inverse document frequency (TF-IDF) allows the allocation of higher importance to topic-specific tokens [<xref ref-type="bibr" rid="ref45">45</xref>]. In this case, the per-topic probability of a token was weighted by the inverse of the probabilities of this token in other topics. For each topic, tokens were ranked from highest to lowest weighted TF-IDF value of their probability in this topic [<xref ref-type="bibr" rid="ref45">45</xref>]. For each topic, the first 15 tokens obtained through this ranking were considered the most associated tokens. These were defined as the set of characteristic tokens and used to label each topic. This label should be a synthesis of the characteristic tokens expressed. Correlations between the different topics were measured. Topics were considered associated when correlations were higher than 0.2 in absolute value. This threshold has been set empirically to allow a post to be associated with 5 topics at most. Discussion topics were merged in <italic>groups</italic> of topics on the basis of the values of correlations, and some focus was on categories of interest by applying a new topic model to the associated messages. The analysis was performed using the Structural Topic Model package [<xref ref-type="bibr" rid="ref46">46</xref>] with R environment version 3.5.2.</p>
        </sec>
        <sec>
          <title>User Segmentation</title>
          <p>A nonsupervised clustering algorithm (agglomerative hierarchical clustering) was applied on the data to categorize users according to their activity profile, using 36 different features, from 3 categories: symptoms of GI discomfort, identified topics, and website activity. These categories and features are presented in <xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>.</p>
          <p>A specific list of symptoms related to GI discomfort was established on the basis of the Medical Dictionary for Regulatory Activities (MedDRA) terms and colloquial language [<xref ref-type="bibr" rid="ref37">37</xref>]. For this, a review of the medical dictionary, MedDRA version 15.0, was performed to identify all the terms that may be associated with GI discomfort. Subsequently, these terms were manually grouped by anatomical region or pathophysiological mechanism (esophageal disorders, gastric disorders, GI disorders, pain, appetite disorder, etc). A list of these regions and mechanisms used to group these messages is presented in <xref ref-type="supplementary-material" rid="app5">Multimedia Appendix 5</xref>. Fifteen different categories of symptoms were established. A manual enrichment of these groups was made using colloquial language. Automatic screening of messages allowed the identification of specific GI symptoms expressed by web users.</p>
          <p>Website activity of users was measured through different features such as the number of messages, the number of discussions, the dates of the first and last post, the forum name, or the mean posting span. Proportions of posts associated with categories of topics identified for the first objective were considered as the last type of features to describe web users. Created clusters of users were described via identity cards presenting the features that allowed them to be singled out, along with their age and gender distribution.</p>
          <p>Web users’ gender was determined through the identification of regular expressions (gendered past participles, adjectives, and names) in messages and the application of a support vector machine on the basis of message content. This method achieves 88% accuracy and is the subject of a pending publication. Web user age categories were identified on the basis of the use of regular expressions of the author’s age in the messages, such as <italic>J’ai 45 ans</italic> (<italic>I am 45 years old</italic>). Each pseudonym was associated with one gender (male, female, or unknown) and one age category (20 years or younger, 21-30 years, 31-40 years, 41-50 years, 51-60 years, 61 years or older, and unknown). The generated identification cards (features, age, and gender) were used to characterize each cluster and evaluate whether these characteristics were homogeneous between clusters.</p>
        </sec>
        <sec>
          <title>Factors of GI Discomfort</title>
          <p>Factors perceived as responsible for the reported symptoms of GI discomfort were identified using a mixed automated analysis method combining syntactic analysis and topic model. The syntactic analysis was designed to identify (1) the messages containing extracted keywords and a causality term and (2) the sentences and phrases where the causality terms are present. To identify causality, a specific dictionary made of terms associated with causality was created. Causality terms consisted of terms or groups of terms expressing causality in French. These terms could be verbs conjugated in different tenses and pronouns (eg, <italic>me donne</italic> [makes me], <italic>lui provoquait</italic> [caused/triggered], <italic>entrainent</italic> [lead to/cause], etc), prepositions (eg, <italic>à cause de</italic> [because of/due to], etc), and conjunctions (eg, <italic>dès lors</italic> [since/consequently], <italic>du fait de</italic> [given that], etc).</p>
          <p>Depending on the causality terms, the position of the segment of phrases where factors could be identified was located either before or after the term, as presented in <xref rid="figure3" ref-type="fig">Figure 3</xref>. A topic model was then applied to the sections of messages depending on the direction associated with each causality term. These terms are presented in <xref ref-type="supplementary-material" rid="app6">Multimedia Appendix 6</xref> along with the associated direction of the segment of phrases to be analyzed. The number of topics was set to 30 to maximize the number of topics associated with factors that could arise. These topics were reviewed manually, and the topics of interest related to factors were identified.</p>
          <fig id="figure3" position="float">
            <label>Figure 3</label>
            <caption>
              <p>Example of messages. (A) Causality term associated with right section. (B) Causality term associated with left section. The sections in which the topic model is applied are indicated in green.</p>
            </caption>
            <graphic xlink:href="jmir_v22i11e17247_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Data Set Description</title>
        <p>After cleaning and formatting, the obtained corpus contained 198,866 messages. A total of 36,989 different web users were associated with this corpus. A total of 29,935 messages (corresponding to 16,746 different web users) contained at least one of the extraction keywords, and 181,365 messages came from the <italic>Doctissimo</italic> subforums (<xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>).</p>
        <p>The most frequent keyword was <italic>abdominal pain,</italic> as presented in <xref ref-type="table" rid="table1">Table 1</xref>. The most frequently mentioned keywords were lay vocabulary: <italic>nausea</italic>, <italic>colic</italic>, <italic>vomiting</italic> and <italic>diarrhea</italic>. More expert terms such as <italic>irritable bowel syndrome</italic>, <italic>irritable bowel,</italic> or <italic>dyspepsia</italic> were used less frequently.</p>
        <p>Messages were retrieved from 14 different generalized and specialized web forums. Extracted data mostly came from <italic>Doctissimo</italic> (182,647/198,866, 91.84% of messages; 27,415/36,989, 74.12% of users). The most frequently used data sources were <italic>Aufeminin</italic> (2325/36,989, 6.29% of web users), <italic>Sante-medecine</italic> (1375/36,989, 3.72% of web users), <italic>Atoute.org</italic> (1350/36,989, 3.65% of web users) and <italic>Onmeda</italic> (1341/36,989, 3.63% of web users).</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Most frequently used extraction keywords.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="370"/>
            <col width="270"/>
            <col width="360"/>
            <thead>
              <tr valign="top">
                <td>Keyword extraction (top 20)</td>
                <td>English translation</td>
                <td>Number of messages, n (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Mal au ventre</td>
                <td>Abdominal pain</td>
                <td>9011 (4.53)</td>
              </tr>
              <tr valign="top">
                <td>Nausée</td>
                <td>Nausea</td>
                <td>2571 (1.29)</td>
              </tr>
              <tr valign="top">
                <td>Colique</td>
                <td>Colic</td>
                <td>1795 (0.90)</td>
              </tr>
              <tr valign="top">
                <td>Vomissement</td>
                <td>Vomiting</td>
                <td>1722 (0.87)</td>
              </tr>
              <tr valign="top">
                <td>Gargouillis</td>
                <td>Borborygmi</td>
                <td>1698 (0.85)</td>
              </tr>
              <tr valign="top">
                <td>Diarrhée</td>
                <td>Diarrhea</td>
                <td>1642 (0.83)</td>
              </tr>
              <tr valign="top">
                <td>Ballonnement</td>
                <td>Bloating</td>
                <td>1548 (0.78)</td>
              </tr>
              <tr valign="top">
                <td>Constipation</td>
                <td>Constipation</td>
                <td>1352 (0.68)</td>
              </tr>
              <tr valign="top">
                <td>Des gaz</td>
                <td>Gas</td>
                <td>1070 (0.54)</td>
              </tr>
              <tr valign="top">
                <td>Rot</td>
                <td>Burp</td>
                <td>996 (0.50)</td>
              </tr>
              <tr valign="top">
                <td>Pet</td>
                <td>Fart</td>
                <td>847 (0.43)</td>
              </tr>
              <tr valign="top">
                <td>Colopathe</td>
                <td>IBS<sup>a</sup></td>
                <td>837 (0.42)</td>
              </tr>
              <tr valign="top">
                <td>Colopathie fonctionnelle</td>
                <td>IBS</td>
                <td>757 (0.38)</td>
              </tr>
              <tr valign="top">
                <td>Côlon irritable</td>
                <td>Irritable bowel</td>
                <td>609 (0.31)</td>
              </tr>
              <tr valign="top">
                <td>Problèmes intestinaux</td>
                <td>Bowel problems</td>
                <td>599 (0.30)</td>
              </tr>
              <tr valign="top">
                <td>Reflux gastrique</td>
                <td>Acid reflux</td>
                <td>488 (0.25)</td>
              </tr>
              <tr valign="top">
                <td>Selles molles</td>
                <td>Loose stools</td>
                <td>452 (0.23)</td>
              </tr>
              <tr valign="top">
                <td>Chiasse</td>
                <td>Runs</td>
                <td>402 (0.20)</td>
              </tr>
              <tr valign="top">
                <td>Flatulence</td>
                <td>Flatulence</td>
                <td>364 (0.18)</td>
              </tr>
              <tr valign="top">
                <td>Dyspepsie</td>
                <td>Dyspepsia</td>
                <td>338 (0.17)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>IBS: irritable bowel syndrome.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Discussion Themes and Topics</title>
        <p>A total of 18 topics of interest were identified on the basis of manual labeling and review of the data (<xref ref-type="table" rid="table2">Table 2</xref>). Although the most discussed topic was related to everyday life, the second most discussed topic was related to diet.</p>
        <p>Topics were gathered into 6 main groups on the basis of their correlations: <italic>consultations, diet, symptoms, quality of life, treatments</italic> and <italic>stress and symptoms</italic>. The <italic>symptoms</italic> category was further subdivided into 3 subcategories: <italic>abdominal pain, GERD,</italic> and <italic>digestion</italic>. The 8 derived categories were used for user segmentation.</p>
        <p>A second topic model was applied to the messages from the group of topics <italic>diet</italic>. This focus allowed the identification of a constellation of subtopics related to symptoms associated with diet (<italic>nausea and vomiting, bloating and gastric reflux</italic>), to the importance of adapting diet to avoid troubles (<italic>diet as a solution to gastric troubles, recipes, balance in diet and efficiency of modifying the diet</italic>), and to food intolerance and intestinal microbiota (<italic>gluten, dairy products and intestinal flora</italic>). This subtopic was rising in 2017 (ie, in both the relative and absolute number of posts discussing this topic), which is the last complete year of the analysis corpus.</p>
        <p>Another topic model was applied to messages from the group of topics <italic>stress and symptoms</italic>. The main identified subtopic was addressing solutions to stress (<italic>sport, courage</italic> and <italic>anxiety</italic>). Other identified subtopics revealed a complex relationship between stress and symptoms of GI discomfort, as some subtopics were presenting GI symptoms as a cause of stress (<italic>impact on social life and persistent gastric symptoms</italic>) and stress as a cause of GI symptoms (<italic>because of stress and pain because of problems</italic>), sometimes during specific periods (<italic>GI symptoms flare during exams or depending on the menstrual cycle</italic>).</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>List of modeled and merged topics.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="360"/>
            <col width="220"/>
            <col width="190"/>
            <col width="230"/>
            <thead>
              <tr valign="top">
                <td>Topics</td>
                <td>Number of messages, n (%)</td>
                <td>Number of users, n (%)</td>
                <td>Group</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Prediagnosis medical consultations</td>
                <td>4752 (2.39)</td>
                <td>2095 (5.66)</td>
                <td>Medical consultations</td>
              </tr>
              <tr valign="top">
                <td>Examinations for diagnostic purposes</td>
                <td>3183 (1.60)</td>
                <td>1283 (3.47)</td>
                <td>Medical consultations</td>
              </tr>
              <tr valign="top">
                <td>Postdiagnosis medical consultations</td>
                <td>2795 (1.41)</td>
                <td>1422 (3.84)</td>
                <td>Medical consultations</td>
              </tr>
              <tr valign="top">
                <td>Medical examinations</td>
                <td>6852 (3.45)</td>
                <td>4013 (10.85)</td>
                <td>Medical consultations</td>
              </tr>
              <tr valign="top">
                <td>Diet</td>
                <td>12,802 (6.44)</td>
                <td>4727 (12.78)</td>
                <td>Diet</td>
              </tr>
              <tr valign="top">
                <td>Food and IBS<sup>a</sup></td>
                <td>2211 (1.11)</td>
                <td>988 (2.67)</td>
                <td>Diet</td>
              </tr>
              <tr valign="top">
                <td>Abdominal pain and nausea</td>
                <td>12,385 (6.23)</td>
                <td>6939 (18.76)</td>
                <td>Symptoms—abdominal pain</td>
              </tr>
              <tr valign="top">
                <td>Abdominal pain</td>
                <td>8370 (4.21)</td>
                <td>4130 (11.17)</td>
                <td>Symptoms—abdominal pain</td>
              </tr>
              <tr valign="top">
                <td>Gastroesophageal reflux disease</td>
                <td>2001 (1.01)</td>
                <td>672 (1.82)</td>
                <td>Symptoms—GERD<sup>b</sup></td>
              </tr>
              <tr valign="top">
                <td>Gastroesophageal reflux disease and heartburn</td>
                <td>6202 (3.12)</td>
                <td>2337 (6.32)</td>
                <td>Symptoms—GERD</td>
              </tr>
              <tr valign="top">
                <td>IBS<sup>a</sup></td>
                <td>2538 (1.28)</td>
                <td>1061 (2.87)</td>
                <td>Symptoms—Digestion</td>
              </tr>
              <tr valign="top">
                <td>Digestion</td>
                <td>12,521 (6.30)</td>
                <td>5290 (14.30)</td>
                <td>Symptoms—Digestion</td>
              </tr>
              <tr valign="top">
                <td>Digestive disorders in children</td>
                <td>4520 (2.27)</td>
                <td>2216 (5.99)</td>
                <td>Symptoms—Digestion</td>
              </tr>
              <tr valign="top">
                <td>Impact on everyday life</td>
                <td>8628 (4.34)</td>
                <td>3672 (9.93)</td>
                <td>Quality of life</td>
              </tr>
              <tr valign="top">
                <td>Everyday life</td>
                <td>16,176 (8.13)</td>
                <td>5902 (15.96)</td>
                <td>Quality of life</td>
              </tr>
              <tr valign="top">
                <td>Medication efficiency</td>
                <td>6240 (3.14)</td>
                <td>2825 (7.64)</td>
                <td>Treatments</td>
              </tr>
              <tr valign="top">
                <td>Information about the treatments</td>
                <td>1561 (0.78)</td>
                <td>856 (2.31)</td>
                <td>Treatments</td>
              </tr>
              <tr valign="top">
                <td>Stress and symptoms</td>
                <td>5679 (2.86)</td>
                <td>2971 (8.03)</td>
                <td>Stress and symptoms</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>IBS: irritable bowel syndrome.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>GERD: gastroesophageal reflux disease.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>User Segmentation</title>
        <p>The algorithms based on regular expressions identified the gender for 14,441 users and the age for 4802 users. These results are presented in <xref ref-type="table" rid="table3">Table 3</xref>. The sex ratio was 0.20.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Users’ characteristics: number of web users and relative number of web users (among 36,989 users).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="280"/>
            <col width="250"/>
            <col width="200"/>
            <col width="270"/>
            <thead>
              <tr valign="top">
                <td>Age range (years)</td>
                <td>Women, n (%)</td>
                <td>Men, n (%)</td>
                <td>Unknown, n (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>0-20</td>
                <td>569 (1.54)</td>
                <td>117 (0.32)</td>
                <td>715 (1.93)</td>
              </tr>
              <tr valign="top">
                <td>21-30</td>
                <td>997 (2.70)</td>
                <td>195 (0.53)</td>
                <td>691 (1.87)</td>
              </tr>
              <tr valign="top">
                <td>31-40</td>
                <td>466 (1.26)</td>
                <td>87 (0.24)</td>
                <td>272 (0.74)</td>
              </tr>
              <tr valign="top">
                <td>41-50</td>
                <td>227 (0.61)</td>
                <td>41 (0.11)</td>
                <td>128 (0.35)</td>
              </tr>
              <tr valign="top">
                <td>51-60</td>
                <td>123 (0.33)</td>
                <td>19 (0.05)</td>
                <td>69 (0.19)</td>
              </tr>
              <tr valign="top">
                <td>61 and over</td>
                <td>42 (0.11)</td>
                <td>13 (0.04)</td>
                <td>31 (0.08)</td>
              </tr>
              <tr valign="top">
                <td>Unknown</td>
                <td>9647 (26.08)</td>
                <td>1898 (5.13)</td>
                <td>20,642 (55.81)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <p>A total of 12.98% (4802/36,989) of the users were characterized according to their age range (62,146/198,866, 31.25% of the messages), and 39.04% (14,441/36,989) of the users were characterized according to their gender (118,882/198,866, 59.78% of the messages). The nonsupervised, bottom-up, hierarchical clustering exhibited 16 different clusters according to the segmentation features presented in <xref ref-type="supplementary-material" rid="app5">Multimedia Appendix 5</xref>. After clustering, the expression of these features was visualized in a heatmap, which is presented in <xref rid="figure4" ref-type="fig">Figure 4</xref>. A review of this heatmap enabled the manual identification of clusters that are presented in <xref ref-type="table" rid="table4">Table 4</xref>. These clusters were labeled according to the expressed features, and only clusters of more than 100 web users were considered. Clusters are generally characterized by types of symptoms or diagnosed diseases (GERD, digestive disorders, stress and abdominal pain).</p>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Heatmap presenting the results of the hierarchical clustering of web users on the basis of the discussed topics, symptoms, and activity on websites. GERD: gastroesophageal reflux disease.</p>
          </caption>
          <graphic xlink:href="jmir_v22i11e17247_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>List of main clusters of web users that were identified (36,989 users).<sup>a</sup></p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="770"/>
            <col width="230"/>
            <thead>
              <tr valign="top">
                <td>Cluster name</td>
                <td>Number of users, n (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Pains and vomiting, stress and abdominal pain</td>
                <td>8026 (21.70)</td>
              </tr>
              <tr valign="top">
                <td>Gastro intestinal disorders associated with diet, digestive disorders, and stress</td>
                <td>1962 (5.30)</td>
              </tr>
              <tr valign="top">
                <td>GERD<sup>b</sup></td>
                <td>1117 (3.02)</td>
              </tr>
              <tr valign="top">
                <td>Borborygmi and abdominal pain</td>
                <td>711 (1.92)</td>
              </tr>
              <tr valign="top">
                <td>Crohn disease</td>
                <td>256 (0.69)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup>Clusters were named according to the features that were expressed in users’ messages.</p>
            </fn>
            <fn id="table4fn2">
              <p><sup>b</sup>GERD: gastroesophageal reflux disease.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>Two clusters were strongly associated with GI disorders. These 2 clusters were also associated with the groups of topics <italic>stress</italic>, <italic>symptoms</italic>, and <italic>diet</italic>. Three clusters were strongly associated with pain, vomiting, and the groups of topics <italic>stress and symptoms</italic> and <italic>symptoms—abdominal pain</italic>. These clusters were associated with a younger population. More generally, clusters associated with undiagnosed symptoms were often associated with the <italic>Stress</italic> topic, whereas clusters associated with diagnosed diseases (GERD and Crohn disease) seemed to be associated with fewer stress features. The 4 clusters associated with the <italic>Diet</italic> topic were also associated with the group of topics <italic>stress and symptoms</italic>.</p>
      </sec>
      <sec>
        <title>Factors of GI Discomfort</title>
        <p>The causality dictionary contained 170 terms. These causality terms were searched in the analysis corpus subset containing extraction keywords (29,935 messages). A total of 20,500 messages (corresponding to 10,848 users) were identified, and a new topic model was applied. The characteristic tokens and a sample of characteristic messages associated with each topic were manually reviewed to identify the themes addressed and the topics related to the causes of GI discomfort. In total, 10 topics of interest arose and were manually labeled and grouped according to the type of factors they expressed. This led to the identification of 7 different types of factors. The proportion of messages associated with these factors was calculated (<xref ref-type="table" rid="table5">Table 5</xref>). The factors that were mostly perceived by web users were related to the <italic>psychological context</italic> (psychological and social factors), followed by <italic>diet</italic> (nutritional factors and allergens or food intolerances) and <italic>medical factors</italic> (GI diseases, gynecological factors, and medical complications).</p>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Perceived factors of gastrointestinal discomfort. Proportions are calculated among the messages with causality terms (20,500 messages).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="630"/>
            <col width="340"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Factors and topics</td>
                <td>Messages, n (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="2">
                  <bold>Psychological factors</bold>
                </td>
                <td>4327 (21.11)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Stress</td>
                <td>2548 (12.43)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Anxiety</td>
                <td>2374 (11.58)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Nutritional factors</td>
                <td>3224 (15.73)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Allergens</td>
                <td>2857 (13.94)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Diagnosed gastrointestinal diseases</bold>
                </td>
                <td>2697 (13.16)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Digestive disorders</td>
                <td>1516 (7.40)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Medical examinations</td>
                <td>1296 (6.32)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <bold>Gynecological factors</bold>
                </td>
                <td>1898 (9.26)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Obstetrical factors</td>
                <td>1005 (4.90)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Gynecological factors</td>
                <td>980 (4.78)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Social factors</td>
                <td>1568 (7.65)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">Medical complications</td>
                <td>1070 (5.22)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>GI discomfort is actively discussed in French web forums, as shown in this study, which enabled the identification of 198,866 messages. In a subcorpus of web users who we were able to characterize according to age and gender, mostly women aged below 40 years were represented (<xref ref-type="table" rid="table3">Table 3</xref>). The gender and age distribution of most active users tended to mirror the higher prevalence of DGBIs such as IBS in younger women [<xref ref-type="bibr" rid="ref47">47</xref>].</p>
        <p>Users described how they were adapting their diet to avoid symptoms linked to perceived food intolerance (<italic>gluten and dairy products</italic>) associated with gut microbiota (<italic>intestinal flora</italic>). This is in line with the increasing number of reports in the literature about the controversial concept of nonceliac gluten sensitivity [<xref ref-type="bibr" rid="ref48">48</xref>].</p>
        <p>As stress was reported by users as both the cause and consequence of their GI symptoms, a focus on the <italic>stress and symptoms</italic> group revealed discussion topics related to the impact of stress on quality of life and solutions to reduce stress, such as physical activity. The role of psychological factors such as anxiety in eliciting or worsening GI symptoms is well established in the literature, both in the general population and in patients affected by DGBIs [<xref ref-type="bibr" rid="ref49">49</xref>].</p>
        <p>User segmentation led to the identification of 16 different classes, grouped into 6 main clusters. The classes associated with symptoms were generally associated with stress, with a stronger association in the case of abdominal pain. The 3 clusters associated with abdominal pain (attributed to diet or digestion) were associated with a younger population. In addition, in all groups of users reporting diet-related features, <italic>Stress</italic> and <italic>Symptoms</italic> topics were also expressed. This suggests a complex relationship between diet, stress, and symptoms of GI discomfort in a real-life setting. We believe that these results may appeal to researchers collecting dietary parameters in nutrition and clinical studies, as the monitoring of dietary intake and habits is important in prospective medical research studies [<xref ref-type="bibr" rid="ref50">50</xref>]. Indeed, further context on meal intake (such as social and emotional context) should be collected to ensure that eating behavior and associated sentiments are accounted for. In a recent review, it was highlighted that emotion tracking is a lacking feature in most downloaded smartphone apps that are used for dietary assessment [<xref ref-type="bibr" rid="ref51">51</xref>]. However, these tools could include features that may be used to examine emotions associated with meals in an observational setting at the population level. Such features would also be important to obtain further information on background diet, which is important when evaluating the efficacy of food and dietary interventions in research [<xref ref-type="bibr" rid="ref52">52</xref>,<xref ref-type="bibr" rid="ref53">53</xref>], especially in patients with DGBIs [<xref ref-type="bibr" rid="ref54">54</xref>].</p>
        <p>Our analysis identified 7 categories of factors of GI discomfort (psychological, nutritional, allergens, diagnosed GI diseases, gynecological, social, and medical complications), showing that food and psychological factors are perceived by web users as the major causes of GI discomfort. Identification of perceived factors revealed complex associations between food and health parameters. As an example, the use of the <italic>fibres</italic> (fibers) keyword revealed contrasting perceptions among web users, with fibers being seen as both a solution to and a cause of GI discomfort (associated with nutritional factors). As noted by another research team analyzing bowel disease–related tweets [<xref ref-type="bibr" rid="ref55">55</xref>], web-based messages about foods and diet (in this case fiber, iron and magnesium) can be positively or negatively perceived depending on the conditions of web users. Regarding other keywords representing factors of food origin, milk, gluten, and fruits were some of the most frequently used terms.</p>
      </sec>
      <sec>
        <title>Comparison With Prior Work</title>
        <p>The results of another study aimed at characterizing the inflammatory bowel disease community based on Twitter discussions during an 8-month period were published while this paper was being prepared [<xref ref-type="bibr" rid="ref55">55</xref>]. This research team also identified that web users shared their experiences and looked for medical advice and that users’ discussions were mainly about inflammatory bowel disease symptoms, related diseases (including anxiety disorders), and foods and diets (including dietary interventions, such as gluten-free and probiotics). These findings are consistent with the main discussion topics that we identified in our corpus, even though the media source (tweets) and language (English) were different, and the studied indication (inflammatory bowel disease) was more specific for this study.</p>
        <p>Recently, the smartphone app <italic>My Symptoms</italic> [<xref ref-type="bibr" rid="ref56">56</xref>] was used by 163 participants to track food intake, psychological distress and GI symptoms in a research study aiming to identify the associations between these parameters. The results of this study were recently published by the research team [<xref ref-type="bibr" rid="ref57">57</xref>], which described strong symptom-symptom associations, especially abdominal pain, bloating, gas-related discomfort, and psychological distress. All these parameters are topics or subtopics that were identified in our study; at the same time, we also noted an association between abdominal pain and stress.</p>
        <p>We identified that topics related to medical consultations and medical examinations were frequently discussed, suggesting an important use of the health care system due to GI disorders, which is consistent with prior work [<xref ref-type="bibr" rid="ref17">17</xref>]. When this paper was drafted, results of another study relying on another source of real-world information, the French National Health Data System (<italic>Système National des Données de Santé</italic>) [<xref ref-type="bibr" rid="ref58">58</xref>], were published [<xref ref-type="bibr" rid="ref59">59</xref>]. This study aimed to assess health care use in a specific case of IBS. This study also revealed an important use of the health care system by patients with IBS, also interestingly suggesting an important medical nomadism for these patients in France.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>A limitation of this study is inherent to the particularities of web forums, where web users do not necessarily reflect the characteristics of the general population. Although the large number of extracted messages could favor the variability of users’ characteristics, these results cannot be generalized to all patients affected by GI discomfort.</p>
        <p>An extraction bias is associated with the considered data sources and keywords selected for analysis. Moreover, information found in messages cannot be interpreted as it would be from a questionnaire. Handling missing information is a key example: the fact that a piece of information is not found in messages does not mean that users did not experience it. For these reasons, it can be difficult to draw conclusions in cases of missing or unclear data. Another example is the identification of the age and gender of web users, which is not possible if not indicated in the source and was not systematically identified in our study.</p>
        <p>An additional limitation is the observational bias inherent to semantic analysis and natural language processing. The use of automatic analysis allows us to analyze a large amount of information but is subject to limitations arising from the abilities of the algorithms. Moreover, regarding topic models, the fact that topics must be manually labeled is also a source of bias.</p>
        <p>The processing of lay language as source data prevents us from drawing further conclusions on the identified factors of GI discomfort that would require a high level of knowledge from web users. These factors are, therefore, presented as <italic>perceived</italic> factors in this paper as the assessment of their relationship with symptoms of GI discomfort results from self-assessment by web users. In addition, this analysis revealed several misconceptions, especially about factors of food origin. For example, web users may discuss food-allergic reactions but may refer to symptoms that are unlikely to be mediated by the immune system or compounds that are not known to be the cause of allergic reactions but rather of hypersensitivity or intolerance (eg, lactose). This is consistent with the results of a population-based survey published during this study, which concluded that the population-estimated prevalence of allergy was twice as high as that estimated by physicians [<xref ref-type="bibr" rid="ref60">60</xref>]. However, despite these limitations due to the analyses in lay language, our study confirmed a known and complex relationship between food, stress, and psychological factors when considering online forums as a complementary source of real-world evidence.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>GI discomfort is an actively discussed topic in French web forums. When identified in a portion of active users, the gender and age of most active users tend to mirror the higher prevalence of DGBIs in women aged below 40 years. We were able to segment web users into several clusters corresponding to specific GI symptoms or diagnosed disorders and characterized by distinct demographic parameters and expression of variables related to stress. The main factors of GI discomfort as perceived by web users are food and psychological factors. This paper could benefit from a similar analysis based on additional sources to cover further languages (eg, English) to study the similarities and differences of the results at a larger scale and with different dietary and cultural backgrounds. To conclude, this innovative infodemiology approach has shown that identifying discussion topics associated with GI discomfort online is feasible and can serve as a complementary source of real-world evidence.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Corpus description.</p>
        <media xlink:href="jmir_v22i11e17247_app1.docx" xlink:title="DOCX File , 21 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Number of extracted messages and associated number of web users per data source.</p>
        <media xlink:href="jmir_v22i11e17247_app2.docx" xlink:title="DOCX File , 22 KB"/>
      </supplementary-material>
      <supplementary-material id="app3">
        <label>Multimedia Appendix 3</label>
        <p>List of keywords used for the extraction of messages.</p>
        <media xlink:href="jmir_v22i11e17247_app3.docx" xlink:title="DOCX File , 23 KB"/>
      </supplementary-material>
      <supplementary-material id="app4">
        <label>Multimedia Appendix 4</label>
        <p>List of features used for the segmentation of web users.</p>
        <media xlink:href="jmir_v22i11e17247_app4.docx" xlink:title="DOCX File , 21 KB"/>
      </supplementary-material>
      <supplementary-material id="app5">
        <label>Multimedia Appendix 5</label>
        <p>List of anatomical regions and pathophysiological mechanisms used for the segmentation of users.</p>
        <media xlink:href="jmir_v22i11e17247_app5.docx" xlink:title="DOCX File , 20 KB"/>
      </supplementary-material>
      <supplementary-material id="app6">
        <label>Multimedia Appendix 6</label>
        <p>List of causality terms used for the identification of perceived factors.</p>
        <media xlink:href="jmir_v22i11e17247_app6.docx" xlink:title="DOCX File , 28 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">DGBI</term>
          <def>
            <p>disorders of gut-brain interaction</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">GERD</term>
          <def>
            <p>gastroesophageal reflux disease</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">GI</term>
          <def>
            <p>gastrointestinal</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">IBS</term>
          <def>
            <p>irritable bowel syndrome</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">LDA</term>
          <def>
            <p>latent Dirichlet allocation</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">MedDRA</term>
          <def>
            <p>Medical Dictionary for Regulatory Activities</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">TF-IDF</term>
          <def>
            <p>term frequency-inverse document frequency</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This study was funded by Danone Nutricia Research.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>FS, JJ, and BL are employees of Danone Nutricia Research. GF received consulting fees from Danone Nutricia Research.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Locke</surname>
              <given-names>GR</given-names>
            </name>
            <name name-style="western">
              <surname>Choung</surname>
              <given-names>RS</given-names>
            </name>
            <name name-style="western">
              <surname>Zinsmeister</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>Schleck</surname>
              <given-names>CD</given-names>
            </name>
            <name name-style="western">
              <surname>Talley</surname>
              <given-names>NJ</given-names>
            </name>
          </person-group>
          <article-title>Prevalence and risk factors for abdominal bloating and visible distention: a population-based study</article-title>
          <source>Gut</source>
          <year>2008</year>
          <month>06</month>
          <volume>57</volume>
          <issue>6</issue>
          <fpage>756</fpage>
          <lpage>63</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/18477677"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/gut.2007.142810</pub-id>
          <pub-id pub-id-type="medline">18477677</pub-id>
          <pub-id pub-id-type="pii">57/6/756</pub-id>
          <pub-id pub-id-type="pmcid">PMC2581929</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tielemans</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Jaspers Focks</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>van Rossum</surname>
              <given-names>LG</given-names>
            </name>
            <name name-style="western">
              <surname>Eikendal</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Jansen</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Laheij</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>van Oijen</surname>
              <given-names>MG</given-names>
            </name>
          </person-group>
          <article-title>Gastrointestinal symptoms are still prevalent and negatively impact health-related quality of life: a large cross-sectional population based study in The Netherlands</article-title>
          <source>PLoS One</source>
          <year>2013</year>
          <volume>8</volume>
          <issue>7</issue>
          <fpage>e69876</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0069876"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0069876</pub-id>
          <pub-id pub-id-type="medline">23922836</pub-id>
          <pub-id pub-id-type="pii">PONE-D-13-11542</pub-id>
          <pub-id pub-id-type="pmcid">PMC3726702</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schmulson</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Drossman</surname>
              <given-names>DA</given-names>
            </name>
          </person-group>
          <article-title>What is new in Rome IV</article-title>
          <source>J Neurogastroenterol Motil</source>
          <year>2017</year>
          <month>04</month>
          <day>30</day>
          <volume>23</volume>
          <issue>2</issue>
          <fpage>151</fpage>
          <lpage>63</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.jnmjournal.org/journal/view.html?doi=10.5056/jnm16214"/>
          </comment>
          <pub-id pub-id-type="doi">10.5056/jnm16214</pub-id>
          <pub-id pub-id-type="medline">28274109</pub-id>
          <pub-id pub-id-type="pii">jnm16214</pub-id>
          <pub-id pub-id-type="pmcid">PMC5383110</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lovell</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Ford</surname>
              <given-names>AC</given-names>
            </name>
          </person-group>
          <article-title>Global prevalence of and risk factors for irritable bowel syndrome: a meta-analysis</article-title>
          <source>Clin Gastroenterol Hepatol</source>
          <year>2012</year>
          <month>07</month>
          <volume>10</volume>
          <issue>7</issue>
          <fpage>712</fpage>
          <lpage>21.e4</lpage>
          <pub-id pub-id-type="doi">10.1016/j.cgh.2012.02.029</pub-id>
          <pub-id pub-id-type="medline">22426087</pub-id>
          <pub-id pub-id-type="pii">S1542-3565(12)00308-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sperber</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>Dumitrascu</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Fukudo</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Gerson</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Ghoshal</surname>
              <given-names>UC</given-names>
            </name>
            <name name-style="western">
              <surname>Gwee</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Hungin</surname>
              <given-names>AP</given-names>
            </name>
            <name name-style="western">
              <surname>Kang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Minhu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Schmulson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bolotin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Friger</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Freud</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Whitehead</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>The global prevalence of IBS in adults remains elusive due to the heterogeneity of studies: a Rome Foundation working team literature review</article-title>
          <source>Gut</source>
          <year>2017</year>
          <month>06</month>
          <volume>66</volume>
          <issue>6</issue>
          <fpage>1075</fpage>
          <lpage>82</lpage>
          <pub-id pub-id-type="doi">10.1136/gutjnl-2015-311240</pub-id>
          <pub-id pub-id-type="medline">26818616</pub-id>
          <pub-id pub-id-type="pii">gutjnl-2015-311240</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pen</surname>
              <given-names>CL</given-names>
            </name>
            <name name-style="western">
              <surname>Ruszniewski</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Gaudin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Amouretti</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bommelaer</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Frexinos</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Poynard</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Maurel</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Priol</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Bertin</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>The burden cost of French patients suffering from irritable bowel syndrome</article-title>
          <source>Scand J Gastroenterol</source>
          <year>2004</year>
          <month>04</month>
          <volume>39</volume>
          <issue>4</issue>
          <fpage>336</fpage>
          <lpage>43</lpage>
          <pub-id pub-id-type="doi">10.1080/00365520310008458</pub-id>
          <pub-id pub-id-type="medline">15125465</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Frändemark</surname>
              <given-names>Å</given-names>
            </name>
            <name name-style="western">
              <surname>Törnblom</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Jakobsson</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Simrén</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Work productivity and activity impairment in irritable bowel syndrome (IBS): a multifaceted problem</article-title>
          <source>Am J Gastroenterol</source>
          <year>2018</year>
          <month>10</month>
          <volume>113</volume>
          <issue>10</issue>
          <fpage>1540</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1038/s41395-018-0262-x</pub-id>
          <pub-id pub-id-type="medline">30254230</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Canavan</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>West</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Card</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Review article: the economic impact of the irritable bowel syndrome</article-title>
          <source>Aliment Pharmacol Ther</source>
          <year>2014</year>
          <month>11</month>
          <volume>40</volume>
          <issue>9</issue>
          <fpage>1023</fpage>
          <lpage>34</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1111/apt.12938"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/apt.12938</pub-id>
          <pub-id pub-id-type="medline">25199904</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cogliandro</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Antonucci</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>de Giorgio</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Barbara</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Cremon</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Cogliandro</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Frisoni</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Pezzilli</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Morselli-Labate</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Corinaldesi</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Stanghellini</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Patient-reported outcomes and gut dysmotility in functional gastrointestinal disorders</article-title>
          <source>Neurogastroenterol Motil</source>
          <year>2011</year>
          <month>12</month>
          <volume>23</volume>
          <issue>12</issue>
          <fpage>1084</fpage>
          <lpage>91</lpage>
          <pub-id pub-id-type="doi">10.1111/j.1365-2982.2011.01783.x</pub-id>
          <pub-id pub-id-type="medline">21917083</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Posserud</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Syrous</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lindström</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Tack</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Abrahamsson</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Simrén</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Altered rectal perception in irritable bowel syndrome is associated with symptom severity</article-title>
          <source>Gastroenterology</source>
          <year>2007</year>
          <month>10</month>
          <volume>133</volume>
          <issue>4</issue>
          <fpage>1113</fpage>
          <lpage>23</lpage>
          <pub-id pub-id-type="doi">10.1053/j.gastro.2007.07.024</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bennet</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Polster</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Törnblom</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Isaksson</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Capronnier</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tessier</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Le Nevé</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Simrén</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Öhman</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Global cytokine profiles and association with clinical characteristics in patients with irritable bowel syndrome</article-title>
          <source>Am J Gastroenterol</source>
          <year>2016</year>
          <month>08</month>
          <volume>111</volume>
          <issue>8</issue>
          <fpage>1165</fpage>
          <lpage>76</lpage>
          <pub-id pub-id-type="doi">10.1038/ajg.2016.223</pub-id>
          <pub-id pub-id-type="medline">27272011</pub-id>
          <pub-id pub-id-type="pii">ajg2016223</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dunlop</surname>
              <given-names>SP</given-names>
            </name>
            <name name-style="western">
              <surname>Hebden</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Campbell</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Naesdal</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Olbe</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Perkins</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Spiller</surname>
              <given-names>RC</given-names>
            </name>
          </person-group>
          <article-title>Abnormal intestinal permeability in subgroups of diarrhea-predominant irritable bowel syndromes</article-title>
          <source>Am J Gastroenterol</source>
          <year>2006</year>
          <month>06</month>
          <volume>101</volume>
          <issue>6</issue>
          <fpage>1288</fpage>
          <lpage>94</lpage>
          <pub-id pub-id-type="doi">10.1111/j.1572-0241.2006.00672.x</pub-id>
          <pub-id pub-id-type="medline">16771951</pub-id>
          <pub-id pub-id-type="pii">AJG672</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tap</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Derrien</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Törnblom</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Brazeilles</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Cools-Portier</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Doré</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Störsrud</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Le Nevé</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Öhman</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Simrén</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Identification of an intestinal microbiota signature associated with severity of irritable bowel syndrome</article-title>
          <source>Gastroenterology</source>
          <year>2017</year>
          <month>01</month>
          <volume>152</volume>
          <issue>1</issue>
          <fpage>111</fpage>
          <lpage>23.e8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0016-5085(16)35174-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1053/j.gastro.2016.09.049</pub-id>
          <pub-id pub-id-type="medline">27725146</pub-id>
          <pub-id pub-id-type="pii">S0016-5085(16)35174-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zvolensky</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Jardin</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Farris</surname>
              <given-names>SG</given-names>
            </name>
            <name name-style="western">
              <surname>Kauffman</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Bakhshaie</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Garey</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Manning</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Rogers</surname>
              <given-names>AH</given-names>
            </name>
            <name name-style="western">
              <surname>Mayorga</surname>
              <given-names>NA</given-names>
            </name>
          </person-group>
          <article-title>Gut interpretations: how difficulties in emotion regulation may help explain the relation of visceral sensitivity with depression and anxiety among young adults with gastrointestinal symptoms</article-title>
          <source>Psychol Health Med</source>
          <year>2018</year>
          <month>08</month>
          <volume>23</volume>
          <issue>7</issue>
          <fpage>840</fpage>
          <lpage>5</lpage>
          <pub-id pub-id-type="doi">10.1080/13548506.2018.1455984</pub-id>
          <pub-id pub-id-type="medline">29580068</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zamani</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Alizadeh-Tabari</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zamani</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Systematic review with meta-analysis: the prevalence of anxiety and depression in patients with irritable bowel syndrome</article-title>
          <source>Aliment Pharmacol Ther</source>
          <year>2019</year>
          <month>07</month>
          <volume>50</volume>
          <issue>2</issue>
          <fpage>132</fpage>
          <lpage>43</lpage>
          <pub-id pub-id-type="doi">10.1111/apt.15325</pub-id>
          <pub-id pub-id-type="medline">31157418</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Enck</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Koehler</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Weigmann</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Mueller-Lissner</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Abdominal pain, cramping or discomfort impairs quality of life in women: an internet-based observational pilot study focussing on impact of treatment</article-title>
          <source>Z Gastroenterol</source>
          <year>2017</year>
          <month>03</month>
          <volume>55</volume>
          <issue>3</issue>
          <fpage>260</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.1055/s-0043-100022</pub-id>
          <pub-id pub-id-type="medline">28288501</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Brun-Strang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Dapoigny</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lafuma</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wainsten</surname>
              <given-names>JP</given-names>
            </name>
            <name name-style="western">
              <surname>Fagnani</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Irritable bowel syndrome in France: quality of life, medical management, and costs: the Encoli study</article-title>
          <source>Eur J Gastroenterol Hepatol</source>
          <year>2007</year>
          <month>12</month>
          <volume>19</volume>
          <issue>12</issue>
          <fpage>1097</fpage>
          <lpage>103</lpage>
          <pub-id pub-id-type="doi">10.1097/MEG.0b013e3282f1621b</pub-id>
          <pub-id pub-id-type="medline">17998835</pub-id>
          <pub-id pub-id-type="pii">00042737-200712000-00013</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ford</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Lacy</surname>
              <given-names>BE</given-names>
            </name>
            <name name-style="western">
              <surname>Talley</surname>
              <given-names>NJ</given-names>
            </name>
          </person-group>
          <article-title>Irritable bowel syndrome</article-title>
          <source>N Engl J Med</source>
          <year>2017</year>
          <month>06</month>
          <day>29</day>
          <volume>376</volume>
          <issue>26</issue>
          <fpage>2566</fpage>
          <lpage>78</lpage>
          <pub-id pub-id-type="doi">10.1056/NEJMra1607547</pub-id>
          <pub-id pub-id-type="medline">28657875</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mahon</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lifschitz</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Ludwig</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Thapar</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Glanville</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Miqdady</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Saps</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Quak</surname>
              <given-names>SH</given-names>
            </name>
            <name name-style="western">
              <surname>Wijnkoop</surname>
              <given-names>LI</given-names>
            </name>
            <name name-style="western">
              <surname>Edwards</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wood</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Szajewska</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>The costs of functional gastrointestinal disorders and related signs and symptoms in infants: a systematic literature review and cost calculation for England</article-title>
          <source>Br Med J Open</source>
          <year>2017</year>
          <month>11</month>
          <day>14</day>
          <volume>7</volume>
          <issue>11</issue>
          <fpage>e015594</fpage>
          <pub-id pub-id-type="doi">10.1136/bmjopen-2016-015594</pub-id>
          <pub-id pub-id-type="medline">29138194</pub-id>
          <pub-id pub-id-type="pii">bmjopen-2016-015594</pub-id>
          <pub-id pub-id-type="pmcid">PMC5695302</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>El-Salhy</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ostgaard</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Gundersen</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Hatlebakk</surname>
              <given-names>JG</given-names>
            </name>
            <name name-style="western">
              <surname>Hausken</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>The role of diet in the pathogenesis and management of irritable bowel syndrome (Review)</article-title>
          <source>Int J Mol Med</source>
          <year>2012</year>
          <month>05</month>
          <volume>29</volume>
          <issue>5</issue>
          <fpage>723</fpage>
          <lpage>31</lpage>
          <pub-id pub-id-type="doi">10.3892/ijmm.2012.926</pub-id>
          <pub-id pub-id-type="medline">22366773</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Monsbakken</surname>
              <given-names>KW</given-names>
            </name>
            <name name-style="western">
              <surname>Vandvik</surname>
              <given-names>PO</given-names>
            </name>
            <name name-style="western">
              <surname>Farup</surname>
              <given-names>PG</given-names>
            </name>
          </person-group>
          <article-title>Perceived food intolerance in subjects with irritable bowel syndrome – etiology, prevalence and consequences</article-title>
          <source>Eur J Clin Nutr</source>
          <year>2006</year>
          <month>05</month>
          <volume>60</volume>
          <issue>5</issue>
          <fpage>667</fpage>
          <lpage>72</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/sj.ejcn.1602367"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/sj.ejcn.1602367</pub-id>
          <pub-id pub-id-type="medline">16391571</pub-id>
          <pub-id pub-id-type="pii">1602367</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>McKenzie</surname>
              <given-names>YA</given-names>
            </name>
            <name name-style="western">
              <surname>Bowyer</surname>
              <given-names>RK</given-names>
            </name>
            <name name-style="western">
              <surname>Leach</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Gulia</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Horobin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>O'Sullivan</surname>
              <given-names>NA</given-names>
            </name>
            <name name-style="western">
              <surname>Pettitt</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Reeves</surname>
              <given-names>LB</given-names>
            </name>
            <name name-style="western">
              <surname>Seamark</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Thompson</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lomer</surname>
              <given-names>M</given-names>
            </name>
            <collab>(IBS Dietetic Guideline Review Group on behalf of Gastroenterology Specialist Group of the British Dietetic Association)</collab>
          </person-group>
          <article-title>British dietetic association systematic review and evidence-based practice guidelines for the dietary management of irritable bowel syndrome in adults (2016 update)</article-title>
          <source>J Hum Nutr Diet</source>
          <year>2016</year>
          <month>10</month>
          <volume>29</volume>
          <issue>5</issue>
          <fpage>549</fpage>
          <lpage>75</lpage>
          <pub-id pub-id-type="doi">10.1111/jhn.12385</pub-id>
          <pub-id pub-id-type="medline">27272325</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Halmos</surname>
              <given-names>EP</given-names>
            </name>
            <name name-style="western">
              <surname>Gibson</surname>
              <given-names>PR</given-names>
            </name>
          </person-group>
          <article-title>Controversies and reality of the FODMAP diet for patients with irritable bowel syndrome</article-title>
          <source>J Gastroenterol Hepatol</source>
          <year>2019</year>
          <month>07</month>
          <volume>34</volume>
          <issue>7</issue>
          <fpage>1134</fpage>
          <lpage>42</lpage>
          <pub-id pub-id-type="doi">10.1111/jgh.14650</pub-id>
          <pub-id pub-id-type="medline">30945376</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Whitfield</surname>
              <given-names>KL</given-names>
            </name>
            <name name-style="western">
              <surname>Shulman</surname>
              <given-names>RJ</given-names>
            </name>
          </person-group>
          <article-title>Treatment options for functional gastrointestinal disorders: from empiric to complementary approaches</article-title>
          <source>Pediatr Ann</source>
          <year>2009</year>
          <month>05</month>
          <volume>38</volume>
          <issue>5</issue>
          <fpage>288</fpage>
          <lpage>90, 92</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/19476303"/>
          </comment>
          <pub-id pub-id-type="medline">19476303</pub-id>
          <pub-id pub-id-type="pmcid">PMC2830707</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fox</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Duggan</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Health Online</article-title>
          <source>Pew Research Center</source>
          <year>2013</year>
          <month>01</month>
          <day>15</day>
          <access-date>2018-02-27</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.pewinternet.org/2013/01/15/health-online-2013/">http://www.pewinternet.org/2013/01/15/health-online-2013/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Khan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Baharudin</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Khan</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>A review of machine learning algorithms for text-documents classification</article-title>
          <source>Journal of Advances in Information Technology</source>
          <year>2010</year>
          <month>02</month>
          <day>1</day>
          <volume>1</volume>
          <issue>1</issue>
          <fpage>4</fpage>
          <lpage>20</lpage>
          <pub-id pub-id-type="doi">10.4304/jait.1.1.4-20</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Speier</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Ong</surname>
              <given-names>MK</given-names>
            </name>
            <name name-style="western">
              <surname>Arnold</surname>
              <given-names>CW</given-names>
            </name>
          </person-group>
          <article-title>Using phrases and document metadata to improve topic modeling of clinical reports</article-title>
          <source>J Biomed Inform</source>
          <year>2016</year>
          <month>06</month>
          <volume>61</volume>
          <fpage>260</fpage>
          <lpage>6</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(16)30028-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2016.04.005</pub-id>
          <pub-id pub-id-type="medline">27109931</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(16)30028-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC4902330</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Rashid</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Koblick</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>AT</given-names>
            </name>
            <name name-style="western">
              <surname>Levy</surname>
              <given-names>GD</given-names>
            </name>
            <name name-style="western">
              <surname>Cheetham</surname>
              <given-names>TC</given-names>
            </name>
          </person-group>
          <article-title>Using natural language processing and machine learning to identify gout flares from electronic clinical notes</article-title>
          <source>Arthritis Care Res (Hoboken)</source>
          <year>2014</year>
          <month>11</month>
          <volume>66</volume>
          <issue>11</issue>
          <fpage>1740</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1002/acr.22324"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/acr.22324</pub-id>
          <pub-id pub-id-type="medline">24664671</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mao</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Chung</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Benton</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hill</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ungar</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Leonard</surname>
              <given-names>CE</given-names>
            </name>
            <name name-style="western">
              <surname>Hennessy</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Holmes</surname>
              <given-names>JH</given-names>
            </name>
          </person-group>
          <article-title>Online discussion of drug side effects and discontinuation among breast cancer survivors</article-title>
          <source>Pharmacoepidemiol Drug Saf</source>
          <year>2013</year>
          <month>03</month>
          <volume>22</volume>
          <issue>3</issue>
          <fpage>256</fpage>
          <lpage>62</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/23322591"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/pds.3365</pub-id>
          <pub-id pub-id-type="medline">23322591</pub-id>
          <pub-id pub-id-type="pmcid">PMC4380018</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Faviez</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Schuck</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lillo-Le-Louët</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Texier</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Dahamna</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Huot</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Foulquié</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Pereira</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Leroux</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Karapetiantz</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Guenegou-Arnoux</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Katsahian</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bousquet</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Burgun</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Mining patients' narratives in social media for pharmacovigilance: adverse effects and misuse of methylphenidate</article-title>
          <source>Front Pharmacol</source>
          <year>2018</year>
          <volume>9</volume>
          <fpage>541</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.3389/fphar.2018.00541"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fphar.2018.00541</pub-id>
          <pub-id pub-id-type="medline">29881351</pub-id>
          <pub-id pub-id-type="pmcid">PMC5978246</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Foulquié</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Voillot</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Faviez</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Mebarki</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Texier</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Schück</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Étude de l’usage du méthylphénidate sur les réseaux sociaux</article-title>
          <source>Revue d'Épidémiologie et de Santé Publique</source>
          <year>2018</year>
          <month>06</month>
          <volume>66</volume>
          <fpage>S225</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1016/j.respe.2018.04.030"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.respe.2018.04.030</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schück</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Foulquié</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Mebarki</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Voillot</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Texier</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Faviez</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Détection automatique du mésusage des neuroleptiques dans le trouble anxieux et la démence à partir des réseaux sociaux</article-title>
          <source>Revue d'Épidémiologie et de Santé Publique</source>
          <year>2018</year>
          <month>06</month>
          <volume>66</volume>
          <fpage>S211</fpage>
          <lpage>2</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1016/j.respe.2018.04.048"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.respe.2018.04.048</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schück</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Voillot</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Foulquié</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Faviez</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Mebarki</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Texier</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Gauvain</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Que nous apportent les réseaux sociaux quant à la crise sanitaire du levothyrox d’août 2017</article-title>
          <source>Revue d'Épidémiologie et de Santé Publique</source>
          <year>2018</year>
          <month>06</month>
          <volume>66</volume>
          <fpage>S225</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1016/j.respe.2018.04.029"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.respe.2018.04.029</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fagherazzi</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Ravaud</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Digital diabetes: perspectives for diabetes prevention, management and research</article-title>
          <source>Diabetes Metab</source>
          <year>2019</year>
          <month>09</month>
          <volume>45</volume>
          <issue>4</issue>
          <fpage>322</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1016/j.diabet.2018.08.012</pub-id>
          <pub-id pub-id-type="medline">30243616</pub-id>
          <pub-id pub-id-type="pii">S1262-3636(18)30171-X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Golder</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ahmed</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Norman</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Booth</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Attitudes toward the ethics of research using social media: a systematic review</article-title>
          <source>J Med Internet Res</source>
          <year>2017</year>
          <month>06</month>
          <day>6</day>
          <volume>19</volume>
          <issue>6</issue>
          <fpage>e195</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2017/6/e195/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.7082</pub-id>
          <pub-id pub-id-type="medline">28588006</pub-id>
          <pub-id pub-id-type="pii">v19i6e195</pub-id>
          <pub-id pub-id-type="pmcid">PMC5478799</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="web">
          <source>Doctissimo Forums</source>
          <year>2020</year>
          <access-date>2020-10-02</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://archive.today/SCVBL">http://archive.today/SCVBL</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Abdellaoui</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Schück</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Texier</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Burgun</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Filtering entities to optimize identification of adverse drug reaction from social media: how can the number of words between entities in the messages help?</article-title>
          <source>JMIR Public Health Surveill</source>
          <year>2017</year>
          <month>06</month>
          <day>22</day>
          <volume>3</volume>
          <issue>2</issue>
          <fpage>e36</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://publichealth.jmir.org/2017/2/e36/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/publichealth.6577</pub-id>
          <pub-id pub-id-type="medline">28642212</pub-id>
          <pub-id pub-id-type="pii">v3i2e36</pub-id>
          <pub-id pub-id-type="pmcid">PMC5500778</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kürzinger</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Schück</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Texier</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Abdellaoui</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Faviez</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Pouget</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Tcherny-Lessenot</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Juhaeri</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Web-based signal detection using medical forums data in France: comparative analysis</article-title>
          <source>J Med Internet Res</source>
          <year>2018</year>
          <month>11</month>
          <day>20</day>
          <volume>20</volume>
          <issue>11</issue>
          <fpage>e10466</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2018/11/e10466/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/10466</pub-id>
          <pub-id pub-id-type="medline">30459145</pub-id>
          <pub-id pub-id-type="pii">v20i11e10466</pub-id>
          <pub-id pub-id-type="pmcid">PMC6280030</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Najork</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Web Crawler Architecture</article-title>
          <source>Encyclopedia of Database Systems</source>
          <access-date>2020-10-02</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1007/978-0-387-39940-9_457">https://doi.org/10.1007/978-0-387-39940-9_457</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ghosh</surname>
              <given-names>DD</given-names>
            </name>
            <name name-style="western">
              <surname>Guha</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>What are we 'tweeting' about obesity? Mapping tweets with topic modeling and geographic information system</article-title>
          <source>Cartogr Geogr Inf Sci</source>
          <year>2013</year>
          <volume>40</volume>
          <issue>2</issue>
          <fpage>90</fpage>
          <lpage>102</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25126022"/>
          </comment>
          <pub-id pub-id-type="doi">10.1080/15230406.2013.776210</pub-id>
          <pub-id pub-id-type="medline">25126022</pub-id>
          <pub-id pub-id-type="pmcid">PMC4128420</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Paul</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Dredze</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Discovering health topics in social media using topic models</article-title>
          <source>PLoS One</source>
          <year>2014</year>
          <volume>9</volume>
          <issue>8</issue>
          <fpage>e103408</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0103408"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0103408</pub-id>
          <pub-id pub-id-type="medline">25084530</pub-id>
          <pub-id pub-id-type="pii">PONE-D-14-00554</pub-id>
          <pub-id pub-id-type="pmcid">PMC4118877</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yesha</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Gangopadhyay</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>A Method for Analyzing Health Behavior in Online Forums</article-title>
          <source>Proceedings of the 6th ACM Conference on Bioinformatics, Computational Biology and Health Informatics</source>
          <year>2015</year>
          <conf-name>BCB'15</conf-name>
          <conf-date>September, 2015</conf-date>
          <conf-loc>Atlanta, Georgia</conf-loc>
          <pub-id pub-id-type="doi">10.1145/2808719.2812592</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tapi Nzali</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Bringay</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lavergne</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Mollevi</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Opitz</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>What patients can tell us: topic analysis for social media on breast cancer</article-title>
          <source>JMIR Med Inform</source>
          <year>2017</year>
          <month>07</month>
          <day>31</day>
          <volume>5</volume>
          <issue>3</issue>
          <fpage>e23</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2017/3/e23/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/medinform.7779</pub-id>
          <pub-id pub-id-type="medline">28760725</pub-id>
          <pub-id pub-id-type="pii">v5i3e23</pub-id>
          <pub-id pub-id-type="pmcid">PMC5556259</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Blei</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Lafferty</surname>
              <given-names>JD</given-names>
            </name>
          </person-group>
          <source>Text Mining: Classification, Clustering, and Applications</source>
          <year>2020</year>
          <publisher-loc>Boca Raton, FL</publisher-loc>
          <publisher-name>CRC Press</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Blei</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Lafferty</surname>
              <given-names>JD</given-names>
            </name>
          </person-group>
          <source>Proceedings of the 23rd International Conference on Machine Learning</source>
          <year>2006</year>
          <month>06</month>
          <conf-name>ICML'06</conf-name>
          <conf-date>June 25-29, 2006</conf-date>
          <conf-loc>University in Pittsburgh, Pennsylvania</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Stewart</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Tingley</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Stm: an R package for structural topic models</article-title>
          <source>J Stat Soft</source>
          <year>2019</year>
          <month>10</month>
          <day>31</day>
          <volume>91</volume>
          <issue>2</issue>
          <fpage>1</fpage>
          <lpage>40</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://archive.today/j05u3"/>
          </comment>
          <pub-id pub-id-type="doi">10.18637/jss.v091.i02</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lovell</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Ford</surname>
              <given-names>AC</given-names>
            </name>
          </person-group>
          <article-title>Effect of gender on prevalence of irritable bowel syndrome in the community: systematic review and meta-analysis</article-title>
          <source>Am J Gastroenterol</source>
          <year>2012</year>
          <month>07</month>
          <volume>107</volume>
          <issue>7</issue>
          <fpage>991</fpage>
          <lpage>1000</lpage>
          <pub-id pub-id-type="doi">10.1038/ajg.2012.131</pub-id>
          <pub-id pub-id-type="medline">22613905</pub-id>
          <pub-id pub-id-type="pii">ajg2012131</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pinto-Sanchez</surname>
              <given-names>MI</given-names>
            </name>
            <name name-style="western">
              <surname>Verdu</surname>
              <given-names>EF</given-names>
            </name>
          </person-group>
          <article-title>Non-celiac gluten or wheat sensitivity: it's complicated!</article-title>
          <source>Neurogastroenterol Motil</source>
          <year>2018</year>
          <month>08</month>
          <volume>30</volume>
          <issue>8</issue>
          <fpage>e13392</fpage>
          <pub-id pub-id-type="doi">10.1111/nmo.13392</pub-id>
          <pub-id pub-id-type="medline">30854780</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>McNaughton</surname>
              <given-names>DT</given-names>
            </name>
            <name name-style="western">
              <surname>Andreasson</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ljótsson</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Beath</surname>
              <given-names>AP</given-names>
            </name>
            <name name-style="western">
              <surname>Hush</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Talley</surname>
              <given-names>NJ</given-names>
            </name>
            <name name-style="western">
              <surname>Ljunggren</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Schmidt</surname>
              <given-names>PT</given-names>
            </name>
            <name name-style="western">
              <surname>Agréus</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>MP</given-names>
            </name>
          </person-group>
          <article-title>Effects of psychology and extragastrointestinal symptoms on health care use by subjects with and without irritable bowel syndrome</article-title>
          <source>Clin Gastroenterol Hepatol</source>
          <year>2020</year>
          <month>04</month>
          <volume>18</volume>
          <issue>4</issue>
          <fpage>847</fpage>
          <lpage>54.e1</lpage>
          <pub-id pub-id-type="doi">10.1016/j.cgh.2019.07.019</pub-id>
          <pub-id pub-id-type="medline">31323378</pub-id>
          <pub-id pub-id-type="pii">S1542-3565(19)30752-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Satija</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Willett</surname>
              <given-names>WC</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>FB</given-names>
            </name>
          </person-group>
          <article-title>Understanding nutritional epidemiology and its role in policy</article-title>
          <source>Adv Nutr</source>
          <year>2015</year>
          <month>01</month>
          <volume>6</volume>
          <issue>1</issue>
          <fpage>5</fpage>
          <lpage>18</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25593140"/>
          </comment>
          <pub-id pub-id-type="doi">10.3945/an.114.007492</pub-id>
          <pub-id pub-id-type="medline">25593140</pub-id>
          <pub-id pub-id-type="pii">6/1/5</pub-id>
          <pub-id pub-id-type="pmcid">PMC4288279</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ferrara</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hua</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Seto</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>A focused review of smartphone diet-tracking apps: usability, functionality, coherence with behavior change theory, and comparative validity of nutrient intake and energy estimates</article-title>
          <source>JMIR Mhealth Uhealth</source>
          <year>2019</year>
          <month>05</month>
          <day>17</day>
          <volume>7</volume>
          <issue>5</issue>
          <fpage>e9232</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mhealth.jmir.org/2019/5/e9232/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/mhealth.9232</pub-id>
          <pub-id pub-id-type="medline">31102369</pub-id>
          <pub-id pub-id-type="pii">v7i5e9232</pub-id>
          <pub-id pub-id-type="pmcid">PMC6543803</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schäfer</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Jeanne</surname>
              <given-names>JF</given-names>
            </name>
          </person-group>
          <article-title>Evaluating the effects of food on health in a world of evolving operational challenges</article-title>
          <source>Contemp Clin Trials Commun</source>
          <year>2018</year>
          <month>12</month>
          <volume>12</volume>
          <fpage>51</fpage>
          <lpage>4</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2451-8654(18)30084-X"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.conctc.2018.09.001</pub-id>
          <pub-id pub-id-type="medline">30259002</pub-id>
          <pub-id pub-id-type="pii">S2451-8654(18)30084-X</pub-id>
          <pub-id pub-id-type="pmcid">PMC6151854</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Khazen</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Jeanne</surname>
              <given-names>JF</given-names>
            </name>
            <name name-style="western">
              <surname>Demaretz</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Schäfer</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Fagherazzi</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Rethinking the use of mobile apps for dietary assessment in medical research</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <month>06</month>
          <day>18</day>
          <volume>22</volume>
          <issue>6</issue>
          <fpage>e15619</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/6/e15619/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/15619</pub-id>
          <pub-id pub-id-type="medline">32554383</pub-id>
          <pub-id pub-id-type="pii">v22i6e15619</pub-id>
          <pub-id pub-id-type="pmcid">PMC7333076</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yao</surname>
              <given-names>CK</given-names>
            </name>
            <name name-style="western">
              <surname>Gibson</surname>
              <given-names>PR</given-names>
            </name>
            <name name-style="western">
              <surname>Shepherd</surname>
              <given-names>SJ</given-names>
            </name>
          </person-group>
          <article-title>Design of clinical trials evaluating dietary interventions in patients with functional gastrointestinal disorders</article-title>
          <source>Am J Gastroenterol</source>
          <year>2013</year>
          <month>05</month>
          <volume>108</volume>
          <issue>5</issue>
          <fpage>748</fpage>
          <lpage>58</lpage>
          <pub-id pub-id-type="doi">10.1038/ajg.2013.77</pub-id>
          <pub-id pub-id-type="medline">23609614</pub-id>
          <pub-id pub-id-type="pii">ajg201377</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pérez-Pérez</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pérez-Rodríguez</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Fdez-Riverola</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Lourenço</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Using Twitter to understand the human bowel disease community: exploratory analysis of key topics</article-title>
          <source>J Med Internet Res</source>
          <year>2019</year>
          <month>08</month>
          <day>15</day>
          <volume>21</volume>
          <issue>8</issue>
          <fpage>e12610</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2019/8/e12610/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/12610</pub-id>
          <pub-id pub-id-type="medline">31411142</pub-id>
          <pub-id pub-id-type="pii">v21i8e12610</pub-id>
          <pub-id pub-id-type="pmcid">PMC6711036</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="web">
          <source>mySymptoms App</source>
          <access-date>2020-10-02</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://skygazerlabs.com/wp/">https://skygazerlabs.com/wp/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Clevers</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Törnblom</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Simrén</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tack</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>van Oudenhove</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Relations between food intake, psychological distress, and gastrointestinal symptoms: a diary study</article-title>
          <source>United European Gastroenterol J</source>
          <year>2019</year>
          <month>08</month>
          <volume>7</volume>
          <issue>7</issue>
          <fpage>965</fpage>
          <lpage>73</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/31428421"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/2050640619839859</pub-id>
          <pub-id pub-id-type="medline">31428421</pub-id>
          <pub-id pub-id-type="pii">10.1177_2050640619839859</pub-id>
          <pub-id pub-id-type="pmcid">PMC6683644</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="web">
          <article-title>Qu’est-ce que le SNDS ?</article-title>
          <source>Système National Des Données De Santé</source>
          <year>2020</year>
          <access-date>2020-10-02</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://archive.today/7DDam">http://archive.today/7DDam</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sabaté</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Rivière</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Jouet</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Gastaldi-Menager</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Fagot-Campagna</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Tuppin</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Healthcare use by 30,000 patients with irritable bowel syndrome (IBS) in France: a 5-year retrospective and one-year prospective national observational study</article-title>
          <source>BMC Gastroenterol</source>
          <year>2019</year>
          <month>06</month>
          <day>27</day>
          <volume>19</volume>
          <issue>1</issue>
          <fpage>111</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcgastroenterol.biomedcentral.com/articles/10.1186/s12876-019-1031-z"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12876-019-1031-z</pub-id>
          <pub-id pub-id-type="medline">31248366</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12876-019-1031-z</pub-id>
          <pub-id pub-id-type="pmcid">PMC6598248</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gupta</surname>
              <given-names>RS</given-names>
            </name>
            <name name-style="western">
              <surname>Warren</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>BM</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Blumenstock</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Davis</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Schleimer</surname>
              <given-names>RP</given-names>
            </name>
            <name name-style="western">
              <surname>Nadeau</surname>
              <given-names>KC</given-names>
            </name>
          </person-group>
          <article-title>Prevalence and severity of food allergies among US adults</article-title>
          <source>JAMA Netw Open</source>
          <year>2019</year>
          <month>01</month>
          <day>4</day>
          <volume>2</volume>
          <issue>1</issue>
          <fpage>e185630</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://jamanetwork.com/journals/jamanetworkopen/fullarticle/10.1001/jamanetworkopen.2018.5630"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jamanetworkopen.2018.5630</pub-id>
          <pub-id pub-id-type="medline">30646188</pub-id>
          <pub-id pub-id-type="pii">2720064</pub-id>
          <pub-id pub-id-type="pmcid">PMC6324316</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
