<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v25i1e47849</article-id>
      <article-id pub-id-type="pmid">38015600</article-id>
      <article-id pub-id-type="doi">10.2196/47849</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Scoping the Priorities and Concerns of Parents: Infodemiology Study of Posts on Mumsnet and Reddit</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Mavragani</surname>
            <given-names>Amaryllis</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Taylor</surname>
            <given-names>Rachael</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Yu</surname>
            <given-names>Jungok</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Thornton</surname>
            <given-names>Christopher</given-names>
          </name>
          <degrees>BSc, MRes, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>National Institute for Health and Care Research Innovation Observatory</institution>
            <institution>Population Health Sciences Institute</institution>
            <institution>Newcastle University</institution>
            <addr-line>3 Science Square</addr-line>
            <addr-line>Newcastle Helix</addr-line>
            <addr-line>Newcastle Upon Tyne, NE4 5TG</addr-line>
            <country>United Kingdom</country>
            <phone>44 191 208 2259</phone>
            <email>chris.thornton@newcastle.ac.uk</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0055-5500</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Lanyi</surname>
            <given-names>Kate</given-names>
          </name>
          <degrees>BSc, MRes</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-3258-7286</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Wilkins</surname>
            <given-names>Georgina</given-names>
          </name>
          <degrees>BSc, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8800-3596</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Potter</surname>
            <given-names>Rhiannon</given-names>
          </name>
          <degrees>BSc, MRes</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0000-4316-250X</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Hunter</surname>
            <given-names>Emily</given-names>
          </name>
          <degrees>BA, MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9488-350X</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Kolehmainen</surname>
            <given-names>Niina</given-names>
          </name>
          <degrees>MSc, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9229-9913</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Pearson</surname>
            <given-names>Fiona</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1626-0862</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>National Institute for Health and Care Research Innovation Observatory</institution>
        <institution>Population Health Sciences Institute</institution>
        <institution>Newcastle University</institution>
        <addr-line>Newcastle Upon Tyne</addr-line>
        <country>United Kingdom</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Christopher Thornton <email>chris.thornton@newcastle.ac.uk</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2023</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>28</day>
        <month>11</month>
        <year>2023</year>
      </pub-date>
      <volume>25</volume>
      <elocation-id>e47849</elocation-id>
      <history>
        <date date-type="received">
          <day>20</day>
          <month>4</month>
          <year>2023</year>
        </date>
        <date date-type="rev-request">
          <day>13</day>
          <month>9</month>
          <year>2023</year>
        </date>
        <date date-type="rev-recd">
          <day>18</day>
          <month>9</month>
          <year>2023</year>
        </date>
        <date date-type="accepted">
          <day>28</day>
          <month>9</month>
          <year>2023</year>
        </date>
      </history>
      <copyright-statement>©Christopher Thornton, Kate Lanyi, Georgina Wilkins, Rhiannon Potter, Emily Hunter, Niina Kolehmainen, Fiona Pearson. Originally published in the Journal of Medical Internet Research (https://www.jmir.org), 28.11.2023.</copyright-statement>
      <copyright-year>2023</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on https://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2023/1/e47849" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Health technology innovation is increasingly supported by a bottom-up approach to priority setting, aiming to better reflect the concerns of its intended beneficiaries. Web-based forums provide parents with an outlet to share concerns, advice, and information related to parenting and the health and well-being of their children. They provide a rich source of data on parenting concerns and priorities that could inform future child health research and innovation.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>The aim of the study is to identify common concerns expressed on 2 major web-based forums and cluster these to identify potential family health concern topics as indicative priority areas for future research and innovation.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We text-mined the r/Parenting subreddit (69,846 posts) and the parenting section of Mumsnet (99,848 posts) to create a large corpus of posts. A generative statistical model (latent Dirichlet allocation) was used to identify the most discussed topics in the corpus, and content analysis was applied to identify the parenting concerns found in a subset of posts.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>A model with 25 topics produced the highest coherence and a wide range of meaningful parenting concern topics. The most frequently expressed parenting concerns are related to their child’s sleep, self-care, eating (and food), behavior, childcare context, and the parental context including parental conflict. Topics directly associated with infants, such as potty training and bottle feeding, were more common on Mumsnet, while parental context and screen time were more common on r/Parenting.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Latent Dirichlet allocation topic modeling can be applied to gain a rapid, yet meaningful overview of parent concerns expressed on a large and diverse set of social media posts and used to complement traditional insight gathering methods. Parents framed their concerns in terms of children’s everyday health concerns, generating topics that overlap significantly with established family health concern topics. We provide evidence of the range of family health concerns found at these sources and hope this can be used to generate material for use alongside traditional insight gathering methods.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>childhood</kwd>
        <kwd>child</kwd>
        <kwd>toddler</kwd>
        <kwd>infant</kwd>
        <kwd>behavior</kwd>
        <kwd>parent</kwd>
        <kwd>parenting</kwd>
        <kwd>topic modeling</kwd>
        <kwd>data mining</kwd>
        <kwd>social media</kwd>
        <kwd>infodemiology</kwd>
        <kwd>Reddit</kwd>
        <kwd>web-based forum</kwd>
        <kwd>well-being</kwd>
        <kwd>children</kwd>
        <kwd>data</kwd>
        <kwd>family health</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Innovation for health and care is increasingly supported by bottom-up approaches to priority setting [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref4">4</xref>], reflecting the importance of allowing the views and concerns of the intended beneficiaries to influence the aims of innovation [<xref ref-type="bibr" rid="ref5">5</xref>]. Traditional priority-setting methods emphasize collaboration with the intended beneficiaries and can be a lengthy process, involving 15 steps in some cases [<xref ref-type="bibr" rid="ref6">6</xref>]. However, often a more rapid approach to priority setting may be desired, and so, here we present methods to rapidly identify the priorities and family health concerns of parents using web-based forum data.</p>
      <p>The views of parents and children have made important contributions to setting priorities and the conduct of childhood research [<xref ref-type="bibr" rid="ref7">7</xref>-<xref ref-type="bibr" rid="ref10">10</xref>]. Parents are in most cases the primary caregivers for their children and are well placed to provide signals about the needs and concerns related to their children’s health and well-being. This enables the identification of gaps between current child health priorities and the main concerns of parents, which can help to inform the future direction of research and innovation [<xref ref-type="bibr" rid="ref11">11</xref>].</p>
      <p>Social media sites and web-based forums contain the thoughts, questions, opinions, and concerns of parents on a range of topics, where they initiate and drive discussions. Anonymous social media content can augment traditional methods [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref10">10</xref>] used to assess the views of parents and caregivers on a wide range of topics. Novel analysis methods have previously been used to aggregate social media–sourced stories relating to parental attitudes toward vaccine use in children [<xref ref-type="bibr" rid="ref12">12</xref>], to capture the experiences of new fathers [<xref ref-type="bibr" rid="ref13">13</xref>], to understand caregiver burdens [<xref ref-type="bibr" rid="ref14">14</xref>], and to understand the concerns of foster families during the COVID-19 pandemic [<xref ref-type="bibr" rid="ref15">15</xref>].</p>
      <p>Similar methods can be used to identify the unmet needs of families more generally. In this way, it will become feasible to rapidly scope the thoughts and concerns of parents regarding parenting and the health and well-being of their families. Identifying parents’ views in this manner draws from a variety of first-hand experiences and expressions of specific needs, providing a rich source of data on family health concerns for which sufficient information or solutions are likely yet to be found. Here, we aim to provide valuable insight that can be used to identify unmet needs and inform innovation priorities [<xref ref-type="bibr" rid="ref7">7</xref>-<xref ref-type="bibr" rid="ref10">10</xref>].</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Ethical Considerations</title>
        <p>This study was approved (REF 2417/25036) by the Faculty of Medical Sciences Research Ethics Committee, part of Newcastle University's Research Ethics Committee.</p>
      </sec>
      <sec>
        <title>Data Sources</title>
        <p>Mumsnet is a UK-based forum that is widely used to seek advice or emotional support [<xref ref-type="bibr" rid="ref16">16</xref>] through anonymous posts, usually in the form of a question, and responses from other users. The website is not restricted to discussion of parenting, but there is a specific forum for parenting questions. Data collected from Mumsnet have previously been used to describe the views of parents (particularly mothers) and answer a wide range of research questions [<xref ref-type="bibr" rid="ref17">17</xref>-<xref ref-type="bibr" rid="ref20">20</xref>].</p>
        <p>Reddit is a large and widely used general-purpose social media platform. It contains subreddits (subforums) for a wide range of topics, including several on parenting, with r/Parenting the largest of these parenting subreddits. Reddit has increasingly been recognized as an important resource for researchers [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref22">22</xref>], including research into childhood and parenting [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref23">23</xref>].</p>
      </sec>
      <sec>
        <title>Data Collection and Cleaning</title>
        <p>Posts were collected from the r/Parenting subreddit between January 1, 2010, and February 1, 2022, using a custom Python (version 3.8.5; Python Software Foundation) script which called the Pushshift application programming interface [<xref ref-type="bibr" rid="ref24">24</xref>] and from the parenting forum on Mumsnet between April 19, 2001, and March 5, 2022, using a custom Python web scraping script. This captured all posts made on these forums between the dates specified. Posts from both sources were then cleaned by removing placeholders for deleted posts (eg, “[removed]” or “Message withdrawn at poster's request.”), and a spam post containing a single word was posted at a high frequency on one of the forums. We also standardized the spelling and language to British English (eg, diaper to nappy) and standardized apostrophe-like syntax to a single character. Cleaning was performed using custom Python code available at [<xref ref-type="bibr" rid="ref25">25</xref>].</p>
      </sec>
      <sec>
        <title>Data Preprocessing</title>
        <p>We then preprocessed the data, again using custom Python code, to create a corpus for the topic model. This involved removing stopwords (we used the English language stopwords from the Natural Language Tool Kit Python library [<xref ref-type="bibr" rid="ref26">26</xref>]). We also applied the standard preprocessing provided by the gensim Python library [<xref ref-type="bibr" rid="ref27">27</xref>] that removes most punctuation and numeric characters, removes words with fewer than 4 characters, converts all to lowercase, and stems all words. Bigrams (common 2-word phrases) were also detected using the gensim Phrases class and added to the corpus as single entities. The final corpus was composed of the preprocessed posts after words with fewer than 50 occurrences or words that occur in more than 50% of all posts removed.</p>
      </sec>
      <sec>
        <title>Modeling Indicative Topics of Common Concern</title>
        <p>Frequently discussed family health concern topics were detected using latent Dirichlet allocation (LDA), a generative statistical model, previously described in detail elsewhere [<xref ref-type="bibr" rid="ref28">28</xref>]. This involved first compiling a dictionary of all words used in the corpus of texts (social media posts in this case), with each word represented by a number. Each post was then encoded as a set (unordered list) of the words it contains. The LDA process calculates the probability of a given model generating the set of posts we have. This probability is then used to evaluate the model against the data, facilitating the estimation of an optimal model. In the case of gensim, an online variational inference algorithm described here [<xref ref-type="bibr" rid="ref29">29</xref>] is used to perform the optimization. To perform LDA topic modeling, we passed our corpus of texts (stored as vectors of word IDs) to the constructor of LdaMulticore class provided by the gensim library. Hyperparameters were set as follows: passes=20, chunksize=1000, decay=0.5, offset=64, iterations=1000, and gamma threshold=0.001. α was set to a fixed symmetric prior to 1/number of topics. To estimate the optimal number of topics, we performed a scan of the topic number parameter (with a range of 2 to 34 topics), using coherence as our evaluation metric. We repeated this for 10 random initial starting states and used the number with the highest mean coherence. The coherence was assessed by calculating a composite measure known as C<sub>v</sub>, previously shown to correlate well with human-assessed topic coherence [<xref ref-type="bibr" rid="ref30">30</xref>].</p>
        <p>Using the topic distribution calculated for each post, we estimated the probability of each post belonging to a topic. Posts were considered as belonging to a topic if the probability was greater than 75%.</p>
      </sec>
      <sec>
        <title>Labeling and Validation of Topics of Common Concerns</title>
        <p>Topics were interpreted in 2 ways. First, the top 4 words associated with the topic were identified and used to name the topic. This association was calculated using the equation <italic>a</italic>=log (∅)+log (∅)/<italic>P</italic>, where ∅ is the probability of the word given the topic, <italic>P</italic> is the probability of the word appearing in the corpus, and <italic>a</italic> is the association.</p>
        <p>Second, to further facilitate the interpretation of topics as indicative parenting or family health priority areas, we applied a 2-step qualitative analysis to a subset of 50 posts belonging to each topic. The first step was to identify parenting concerns without reference to any prior categories, and the second step was to place each post, if possible, into one or more of the parenting question categories identified by Lavigne et al [<xref ref-type="bibr" rid="ref31">31</xref>]. The posts analyzed were randomly selected from all posts with a greater than 75% probability of being generated by the topic. The full analysis procedure is described below:</p>
        <list list-type="bullet">
          <list-item>
            <p>Posts were distributed among 4 researchers.</p>
          </list-item>
          <list-item>
            <p>Researchers read through each post.</p>
            <list>
              <list-item>
                <p>They identified and noted down each parenting or family health concern (if any) the post contains.
            </p>
              </list-item>
              <list-item>
                <p>They also identified whether the post could be categorized into one or more of the 11 question categories identified by Lavigne et al [<xref ref-type="bibr" rid="ref31">31</xref>].</p>
              </list-item>
              <list-item>
                <p>Posts were collated back together, discussed by the researchers, and then collective decisions were made on any that were unclear.</p>
              </list-item>
            </list>
          </list-item>
          <list-item>
            <p>The parenting or family health concerns occurring 3 or more times within the sample of 50 posts were taken forward as a signal of specific areas of concern. This threshold was selected because it gave a greater than 90% (93.2%) probability of the concern occurring in at least 1% of all posts in the topic (using a proportions z test to determine the likelihood that the proportion 3/50 is greater than 0.01; <italic>P</italic>=.07).</p>
          </list-item>
          <list-item>
            <p>The coherency of each topic was assessed manually by an analysis of the parenting concerns identified. If there was a single concern, or the concerns were closely related, the topic was deemed coherent. If there were multiple concerns that were distinct but with clear connections, the topic was deemed to have related clusters. If there were multiple concerns with no obvious connections, then the topic was deemed to have unrelated clusters.</p>
          </list-item>
        </list>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Topic Model</title>
        <p>We collated 169,694 posts in total, 99,848 from Mumsnet and 69,846 from the r/Parenting subreddit. Of these, 153,182 remained after cleaning and were provided to the LDA topic model for estimation. <xref rid="figure1" ref-type="fig">Figure 1</xref> shows the overall coherence of the topic model with an increasing number of topics. We found that the model coherence improved between 4 and 25 topics, after which it plateaued. A 25 topic model had the highest average coherence across repeats and so was selected as the model to take forward for further analysis.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>The coherence of the topic model as the number of topics increases. The figure shows the 10 repeats performed for each number of topics (thin line) and the mean of all repeats (thick line).</p>
          </caption>
          <graphic xlink:href="jmir_v25i1e47849_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p><xref ref-type="table" rid="table1">Table 1</xref> describes the 25 topics, showing the number of posts assigned to a topic, the 4 words with the highest association with the topic, the specific areas of concern within the topic identified through the inductive content analysis, and the manual assessment of whether the sample of posts from each topic was coherent.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>The 25 topics identified by the optimal LDA<sup>a</sup> model alongside the inductively identified parenting or family health concerns.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="130"/>
            <col width="260"/>
            <col width="470"/>
            <col width="140"/>
            <thead>
              <tr valign="top">
                <td>Posts, n (%)</td>
                <td>LDA topic</td>
                <td>Inductively identified areas of specific parenting or family health concerns</td>
                <td>Coherence of concerns</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>4295 (12.18)</td>
                <td>sleep+night+wake+feed</td>
                <td>Bottle, breastfeeding, crying, nap, regression, routine, sleeping in parents’ bed, sleeping routine, waking up at night</td>
                <td>Related clusters</td>
              </tr>
              <tr valign="top">
                <td>2482 (7.04)</td>
                <td>size+wrap+buggi+cloth</td>
                <td>Affordability, cloth nappies, clothing for carrying baby, clothing temperature</td>
                <td>Related clusters</td>
              </tr>
              <tr valign="top">
                <td>2435 (6.9)</td>
                <td>potti+train+potti_train+toilet</td>
                <td>Potty/toilet training</td>
                <td>Coherent</td>
              </tr>
              <tr valign="top">
                <td>2245 (6.36)</td>
                <td>food+milk+meal+drink</td>
                <td>Food ideas, formula, picky eater, puree food, water, weaning, whole food</td>
                <td>Coherent</td>
              </tr>
              <tr valign="top">
                <td>2132 (6.04)</td>
                <td>pregnant+pregnanc+birth+famili</td>
                <td>Family issues, having another child, leaving child</td>
                <td>Related clusters</td>
              </tr>
              <tr valign="top">
                <td>2053 (5.82)</td>
                <td>work+nurseri+childcar+studi</td>
                <td>Childcare, financial advice, going back to work, studying</td>
                <td>Related clusters</td>
              </tr>
              <tr valign="top">
                <td>1669 (4.73)</td>
                <td>nappi+teeth+dispos+leak</td>
                <td>Cloth nappies, leaking nappies, washing nappies</td>
                <td>Coherent</td>
              </tr>
              <tr valign="top">
                <td>1632 (4.63)</td>
                <td>parent+wife+father+relationship</td>
                <td>Depression, mental health, co-parenting, divorce, grandparents, parenting, parenting style, authoritarian parent</td>
                <td>Related clusters</td>
              </tr>
              <tr valign="top">
                <td>1521 (4.31)</td>
                <td>doctor+sick+cough+hospit</td>
                <td>Child feeling ill, Covid concerns, fever</td>
                <td>Coherent</td>
              </tr>
              <tr valign="top">
                <td>1521 (4.31)</td>
                <td>plai+friend+school+swim</td>
                <td>Activities, fears, friends</td>
                <td>Related clusters</td>
              </tr>
              <tr valign="top">
                <td>1420 (4.03)</td>
                <td>parti+birthdai+seat+christma</td>
                <td>Advice on gifts, affordability, birthdays, Christmas, gifts for others’ children, presents, car seat safety, car seats, growing children, travel</td>
                <td>Unrelated clusters</td>
              </tr>
              <tr valign="top">
                <td>1420 (4.03)</td>
                <td>feel+like+guilti+feel_guilti</td>
                <td>Bad parent worries, feeling guilty, finding it difficult being a parent, feeling overwhelmed, frustration, hoping it will get better</td>
                <td>Coherent</td>
              </tr>
              <tr valign="top">
                <td>1409 (3.99)</td>
                <td>told+behaviour+tell+punish</td>
                <td>Bad behavior, behavioral problems, domestic abuse, sibling violence, intimate partner violent interactions, separated father</td>
                <td>Related clusters</td>
              </tr>
              <tr valign="top">
                <td>1291 (3.66)</td>
                <td>school+book+teacher+read</td>
                <td>Adult course, book recommendations, school admissions, tutoring</td>
                <td>Coherent</td>
              </tr>
              <tr valign="top">
                <td>1281 (3.63)</td>
                <td>reflux+poop+constip+formula</td>
                <td>Allergy, breastfeeding, colic, constipation, digestive issues, milk, milk allergy, reflux, stomach problems</td>
                <td>Coherent</td>
              </tr>
              <tr valign="top">
                <td>958 (2.72)</td>
                <td>word+speech+autism+delai</td>
                <td>Autism, developmental concerns, education questions, speech, speech issues</td>
                <td>Coherent</td>
              </tr>
              <tr valign="top">
                <td>923 (2.62)</td>
                <td>english+speak+languag+French</td>
                <td>Activities, development, friends, language</td>
                <td>Coherent</td>
              </tr>
              <tr valign="top">
                <td>887 (2.51)</td>
                <td>scream+bedtim+tantrum+routin</td>
                <td>Bedtime, bedtime routine, crying/screaming, daily routines, dummy removal, naps, screaming/crying</td>
                <td>Coherent</td>
              </tr>
              <tr valign="top">
                <td>797 (2.26)</td>
                <td>girl+phone+friend+messag</td>
                <td>Child internet concerns, monitoring, social media, social media harm, stranger interactions, trust</td>
                <td>Related clusters</td>
              </tr>
              <tr valign="top">
                <td>716 (2.03)</td>
                <td>room+bedroom+chair+mattress</td>
                <td>Affordability, baby sleeping space, bedroom, sleeping arrangements, bouncy chairs, highchair, living arrangements, safety, toy storage</td>
                <td>Coherent</td>
              </tr>
              <tr valign="top">
                <td>534 (1.51)</td>
                <td>game+watch+video+movi</td>
                <td>Films, hobbies, sport, video games, YouTube</td>
                <td>Coherent</td>
              </tr>
              <tr valign="top">
                <td>518 (1.47)</td>
                <td>hair+wash+clean+bath</td>
                <td>Bath, cleaning, hair, hygiene, nails, potty training, recommendations</td>
                <td>Coherent</td>
              </tr>
              <tr valign="top">
                <td>511 (1.45)</td>
                <td>daycar+monei+covid+mask</td>
                <td>Activities, childcare, Covid, money, responsibility</td>
                <td>Related clusters</td>
              </tr>
              <tr valign="top">
                <td>313 (0.89)</td>
                <td>head+roll+crawl+stair</td>
                <td>Crawling, development, movement, rolling, standing, walking, equipment, falling, illness, injury fears, stairs</td>
                <td>Coherent</td>
              </tr>
              <tr valign="top">
                <td>313 (0.89)</td>
                <td>door+open+mommi+lock</td>
                <td>Child scared, children being funny, explaining death to child, explaining sex to child, pet issues</td>
                <td>Related clusters</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>LDA: latent Dirichlet allocation.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>We found that we could assign 35,276 (23%) posts to a topic with greater than 75% probability and that when we used this to filter posts, topics contained between 313 posts (head+roll+crawl+stair and door+open+mommi+lock) and 4295 posts (sleep+night+wake+feed). <xref rid="figure2" ref-type="fig">Figure 2</xref> shows the number of posts included at each stage of the processing pipeline. <xref rid="figure3" ref-type="fig">Figure 3</xref> shows each topic found by the model, positioned according to a 2-dimensional projection of the distance between topics as calculated by the LDAvis library [<xref ref-type="bibr" rid="ref32">32</xref>]. The 10 most common words in each topic are shown along with words shared between topics. In the final collection, Mumsnet contributed 26,648 posts, while r/Parenting contributed 8628 posts. <xref rid="figure4" ref-type="fig">Figure 4</xref> shows the proportion of posts from each platform that have been assigned to each topic. This allows us to see that some topics are more commonly discussed on 1 platform, for example, potty training and nappy changing topics (potti+train+potti_train+toilet, size+wrap+buggi+cloth, and nappi+teeth+dispos+leak) are more commonly discussed on Mumsnet, while topics on domestic abuse, divorce, and parenting style (told+behaviour+tell+punish and parent+wife+father+relationship) are more common on Reddit. Topics such as sleep (sleep+night+wake+feed), pregnancy (pregnant+pregnanc+birth+famili), or visiting the doctor (doctor+sick+cough+hospit) are equally common on both platforms.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>The number of posts from initial collection to final analysis. LDA: latent Dirichlet allocation.</p>
          </caption>
          <graphic xlink:href="jmir_v25i1e47849_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>The topics identified by the latent Dirichlet allocation process—each circle represents a topic, linked to the 10 most common words used in the topic. The size of the circle represents the size of the topic, and the size of the word represents the frequency of its use. Topics are linked together if their word frequency distribution has a cosine similarity above 0.4 (black line) or if they share a top 10 word (colored line) or both (dashed line).</p>
          </caption>
          <graphic xlink:href="jmir_v25i1e47849_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>The frequency of topic occurrence within each source media. The number of posts is normalized by the total contributed by that source.</p>
          </caption>
          <graphic xlink:href="jmir_v25i1e47849_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Interpretation of Topics</title>
        <p>From the topic validation, we found that, for most LDA topics (14/25), the posts associated with them contained a coherent set of parental concern categories. <xref rid="figure5" ref-type="fig">Figure 5</xref> shows the parenting or family health concern categories identified for each topic. For example, the topic doctor+sick+cough+hospit contained categories all associated with children being ill or taken to the doctor: child feeling ill, COVID concerns, and fever. The topic word+speech+autism+delai likewise contained a coherent set of concerns around development: autism, developmental concerns, education questions, speech, and speech issues.</p>
        <p>Other topics (10/25) appeared to have 2 or more distinct but closely related and co-occurring concerns, for example, the topic sleep+night+wake+feed contained the categories bottle feeding, breastfeeding, infant crying, routine, sleeping in parents’ bed, sleeping routine, nap, regression, and waking up at night. Here, sleep issues co-occur with breastfeeding, and many posts in this topic discuss breastfeeding and sleep. The topic told+behaviour+tell+punish contains posts on intimate partner violence (including child on child, adult on child, and adult on adult violence), generalized concerns around separation and children spending time with their fathers, bad behavior, and behavioral problems. While most topics contain concerns that are related or those we would expect to co-occur, the topic parti+birthdai+seat+christma is an amalgamation of concerns around celebratory events (birthdays or Christmas) and car seats (safety concerns and advice about buying).</p>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>The categories identified manually from within posts sampled from each topic.</p>
          </caption>
          <graphic xlink:href="jmir_v25i1e47849_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Assignment to Categories Identified by Lavigne et al [<xref ref-type="bibr" rid="ref31">31</xref>]</title>
        <p>Traditional priority-setting approaches are an important comparator for topics extracted from large web-based data sets. Here, we make detailed comparisons between our topics and those identified by Lavigne et al [<xref ref-type="bibr" rid="ref31">31</xref>] using traditional priority-setting methods.</p>
        <p>In 15 out of 25 of LDA topics, a majority of posts could be assigned to one or more of the parenting question categories devised by Lavigne et al [<xref ref-type="bibr" rid="ref31">31</xref>]. <xref rid="figure6" ref-type="fig">Figure 6</xref> shows the Lavigne et al [<xref ref-type="bibr" rid="ref31">31</xref>] categories identified within LDA topics. Several topics contain a majority of posts relevant to a single category. For example, sleep+night+wake+feed contained a majority of posts within the <italic>Sleeping or night-time waking</italic> category. Others contained a plurality of categories, for example, the LDA topic door+open+mommi-lock is split between <italic>Child development and learning</italic>, <italic>Safety and injury prevention</italic>, <italic>Mental health</italic>, <italic>Parenting and behaviour</italic>, <italic>Sleeping or night-time waking</italic>, and <italic>Growth, nutrition and physical activity</italic>.</p>
        <fig id="figure6" position="float">
          <label>Figure 6</label>
          <caption>
            <p>The proportion of posts in each topic assigned to the child health categories identified by Lavigne et al [<xref ref-type="bibr" rid="ref31">31</xref>].</p>
          </caption>
          <graphic xlink:href="jmir_v25i1e47849_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>For 10/25 of the LDA topics, a majority of posts were not attributable to any of the categories identified by Lavigne et al [<xref ref-type="bibr" rid="ref31">31</xref>]. In 5 out of 10 of these topics, less than 25% of posts could be attributed to a category. These topics were pregnant+pregnanc+birth+famili—a topic concerned with family planning, nappi+teeth+dispos+leak—a topic concerned with reusable nappies, size+wrap+buggi+cloth—another topic concerned with reusable nappies as well as clothing and transporting a baby, hair+wash+clean+bath—a topic concerning hygiene, and work+nurseri+childcar+studi—a topic covering balancing childcare with work and studying.</p>
        <p>The topics identified here cover 10 out of 11 of the Lavigne et al [<xref ref-type="bibr" rid="ref31">31</xref>] categories. <italic>Environmental toxins</italic> is the only one without representation. <italic>Parenting and behaviour</italic>, <italic>Child development and learning</italic>, <italic>Growth, nutrition and physical activity</italic>, <italic>Sleeping or night-time waking</italic>, <italic>Screen time and media exposure</italic>, and <italic>Preventing childhood infections and other diseases</italic> are all well represented—presenting in multiple topics and as a majority in at least one. <italic>Mental health</italic> and <italic>Poverty and access to car</italic>e are present in multiple topics without being a majority in any, and <italic>Oral health, vision, and hearing</italic> is present in small numbers in 3 topics.</p>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Results</title>
        <p>We have collated posts from the r/Parenting forum and the Mumsnet parenting forum and then used LDA to model the most common topics of discussion. We found that a model with 25 topics was the most coherent. An analysis of the content of posts associated with these topics indicated that most topics brought together posts on a related set of parenting concerns, and we found significant overlap between the content of our LDA topics and parenting priority categories identified using traditional priority-setting methods [<xref ref-type="bibr" rid="ref31">31</xref>].</p>
      </sec>
      <sec>
        <title>Strengths and Limitations</title>
        <p>A key strength of this work is that topic modeling using LDA allows us to use a large collection of posts, revealing the latent semantic structure present within them; however, its outputs can vary significantly depending on parameterization, and the evaluation of output quality is a contentious issue [<xref ref-type="bibr" rid="ref33">33</xref>]. We have used one type of coherence score (C<sub>v</sub>) [<xref ref-type="bibr" rid="ref30">30</xref>] to optimize our selection of the number of topics parameter. However, there are multiple scores that can be used to evaluate the coherence of the model and others that evaluate the model through its predictive ability (perplexity) [<xref ref-type="bibr" rid="ref34">34</xref>]. While there is strong evidence that C<sub>v</sub> correlates more strongly with human interpretability than other evaluation functions for certain benchmark data sets [<xref ref-type="bibr" rid="ref30">30</xref>], there is no guarantee that our parameter selection is optimal. However, we do consider it to be functional, providing topics that we have been able to interpret through further analysis.</p>
        <p>The additional methods used to interpret the topics identified using LDA are also a strength of this work. Applying content analysis allows the context of each post and a subjective interpretation to feed into the description of the topic, while assignment to previously established parenting priority categories [<xref ref-type="bibr" rid="ref31">31</xref>] leverages the data and analysis of previous work. Typically, topic modeling studies use the words most associated with a topic [<xref ref-type="bibr" rid="ref35">35</xref>], or a human interpretation of these words [<xref ref-type="bibr" rid="ref36">36</xref>], to provide a description, but this may not always provide the reader with a complete picture of the topic. Combining LDA and qualitative analysis of a subset of posts has been used previously to provide a more detailed interpretation of topics of parent discussions of fussy eating [<xref ref-type="bibr" rid="ref37">37</xref>] and the concerns of foster families during the COVID-19 pandemic [<xref ref-type="bibr" rid="ref15">15</xref>].</p>
        <p>However, our content analysis and categorization also have limitations. To reduce the labor requirements of the task, we have analyzed a sample of 50 posts from each topic (1%-16% of the total posts in each topic compared to 100 posts or 20% of posts per topic used by others [<xref ref-type="bibr" rid="ref15">15</xref>]). Therefore, the concerns identified may not be fully representative, for example, we could be 90% confident that a concern identified 3 times in the sample of 50 would appear in 0.4%-11.5% of the posts in that topic. A topic appearing 20 times would appear in between 28.6% and 51.3% of posts. So, while the topic-specific concerns shown in <xref ref-type="table" rid="table1">Table 1</xref> and <xref rid="figure5" ref-type="fig">Figure 5</xref> are likely to occur beyond the sample, the proportions they indicate have a large margin of error, and the list is unlikely to be exhaustive. We also recognize that many posts are discarded before content analysis (those with less than 75% probability of being generated by a topic), and so the themes identified are only those present in posts with a strong affinity to the topic.</p>
        <p>Another limitation of this work comes from the representativeness of the social media users as a sample of the wider population [<xref ref-type="bibr" rid="ref38">38</xref>]. As there are no detailed analyses of the sociodemographics of either source available, we can only speculate on whether the views expressed on these forums represent those of the wider population (including those from significant economic deprivation).</p>
        <p>To address this, we envision that future work will take the outputs generated here (the descriptions of the topics) and use them as material for targeted engagement with underrepresented groups such as those on low incomes. This will allow an assessment of whether the views expressed on these forums differ from those of the underrepresented groups and will allow us to bring in the voice of these groups and allow expression of their concerns. We also envision that these data sources may be used to shape future research priorities and identify unmet needs across health and childcare provision, highlighting further the importance of acknowledging the underrepresented voices.</p>
      </sec>
      <sec>
        <title>Comparison With Prior Work</title>
        <p>Previous priority-setting work has identified robust parental concerns relating to childhood chronic disease [<xref ref-type="bibr" rid="ref39">39</xref>], preventative care [<xref ref-type="bibr" rid="ref31">31</xref>], and mental health [<xref ref-type="bibr" rid="ref40">40</xref>]. The views collected in our analysis come from the general population, and so, the concerns found are most comparable to those previously found on preventative care and mental health.</p>
        <p>Our results strengthen the evidence signaling parent priorities in 10 of the 11 parent priority categories presented by Lavigne et al [<xref ref-type="bibr" rid="ref31">31</xref>] on pediatric preventative care. Lavigne et al [<xref ref-type="bibr" rid="ref31">31</xref>] also present the top 10 most important unanswered questions from the perspective of parents and clinicians. Some of these questions are clearly reflected in the priorities identified here. For example, we identify several topics (eg, told+behaviour+tell+punish) that include behavioral problems as a priority, a priority also articulated by Lavigne et al [<xref ref-type="bibr" rid="ref31">31</xref>] with the question “What are effective strategies for behaviour management in children?”. Concerns around the development of one’s child are strongly expressed within the word+speech+autism+delai topic echoing the question “What are effective methods for screening for developmental delay in children?” presented by Lavigne et al [<xref ref-type="bibr" rid="ref31">31</xref>].</p>
        <p>Both Mumsnet and Reddit have been the subject of prior research into parental concerns and pediatric or maternal health [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref18">18</xref>-<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref41">41</xref>]. For example, previous work has highlighted the use of Mumsnet by parents of children with mental health needs [<xref ref-type="bibr" rid="ref20">20</xref>] showing that it was used primarily to offer and receive emotional support and to find advice on methods or techniques that could be used without the help of professionals. We have also found evidence of parents seeking support for children with mental health issues (topic 23—parent+wife+father+relationship) with intergenerational mental health issues, divorce, and authoritarian parenting also found in this topic.</p>
        <p>Previous work using Reddit as a data source has used LDA alongside thematic analysis to investigate parental discussion of fussy eating [<xref ref-type="bibr" rid="ref37">37</xref>]. Using similar methods (but a different subreddit r/Toddler) to those presented here, this work used LDA to cluster posts into topics and then took a single topic (fussy eating) forward for further thematic qualitative analysis.</p>
        <p>This work differs from the above by presenting an overview of discussion on 2 broadly defined parenting forums rather than a more detailed analysis of specific issues. Previous work that has taken a similarly broad approach includes an analysis of the posts on the subreddits r/Mommit and r/Daddit, again combining LDA topic modeling with qualitative analysis to give a broad overview of discussion topics and presenting a comparison between the 2 forums [<xref ref-type="bibr" rid="ref23">23</xref>]. We build on this work by including 2 much larger data sets (99,848 posts from Mumsnet and 69,846 posts from r/Parenting) and outline methods to visualize and perform an inductive content analysis of a data set of this size. We identify many similar topics, including sleep issues, toilet training, food/fussy eating, managing multiple children/sibling conflict, talking about difficult issues, phone/social media use, and parental guilt. This indicates that there are robust concerns that emerge as topics of discussion on a range of parenting forums when this type of analysis is applied. Several additional concerns such as child hygiene, fear of child injury, and fear of being a bad parent were also identified.</p>
        <p>Recent work has also applied LDA modeling to parenting forums such as Momsholic [<xref ref-type="bibr" rid="ref42">42</xref>]. They found feeding, sleeping, medical problems, development, and learning to be the most discussed topics—all major topics found within our analysis. Both studies also agree that sleep is the most discussed.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>Here, we present further evidence on the priorities and concerns of parents through the identification of topics commonly discussed on 2 well-used parenting advice forums (Mumsnet and r/Parenting). Our results show that LDA can be used to identify common parenting concerns from large-scale parenting forum data, and alongside the content analysis outlined here can be used to provide an indicative map of concerns and priorities commonly discussed. This provides a method for the rapid identification of concerns and priorities from these, or similar, large-scale data sources. We also hope our results can be used as a signpost for others looking to use data from these sources, for example, in the development of content for targeted engagement or qualitative research with families.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">LDA</term>
          <def>
            <p>latent Dirichlet allocation</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This research was funded by the National Institute for Health Research Innovation Observatory (UK).</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chan</surname>
              <given-names>EYY</given-names>
            </name>
            <name name-style="western">
              <surname>Gobat</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Dubois</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bedson</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>de Almeida</surname>
              <given-names>JR</given-names>
            </name>
          </person-group>
          <article-title>Bottom-up citizen engagement for health emergency and disaster risk management: directions since COVID-19</article-title>
          <source>Lancet</source>
          <year>2021</year>
          <volume>398</volume>
          <issue>10296</issue>
          <fpage>194</fpage>
          <lpage>196</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34097857"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S0140-6736(21)01233-2</pub-id>
          <pub-id pub-id-type="medline">34097857</pub-id>
          <pub-id pub-id-type="pii">S0140-6736(21)01233-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC8800561</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Orgill</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Marchal</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Shung-King</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sikuza</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Gilson</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Bottom-up innovation for health management capacity development: a qualitative case study in a South African health district</article-title>
          <source>BMC Public Health</source>
          <year>2021</year>
          <volume>21</volume>
          <issue>1</issue>
          <fpage>587</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcpublichealth.biomedcentral.com/articles/10.1186/s12889-021-10546-w"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12889-021-10546-w</pub-id>
          <pub-id pub-id-type="medline">33761911</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12889-021-10546-w</pub-id>
          <pub-id pub-id-type="pmcid">PMC7992952</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bhopal</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Norheim</surname>
              <given-names>OF</given-names>
            </name>
          </person-group>
          <article-title>Priority setting and net zero healthcare: how much health can a tonne of carbon buy?</article-title>
          <source>BMJ</source>
          <year>2021</year>
          <volume>375</volume>
          <fpage>e067199</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.bmj.com/content/375/bmj-2021-067199"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmj-2021-067199</pub-id>
          <pub-id pub-id-type="medline">34711584</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rosa</surname>
              <given-names>AB</given-names>
            </name>
            <name name-style="western">
              <surname>Kimpeler</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Schirrmeister</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Warnke</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Participatory foresight and reflexive innovation: setting policy goals and developing strategies in a bottom-up, mission-oriented, sustainable way</article-title>
          <source>Eur J Futures Res</source>
          <year>2021</year>
          <volume>9</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>15</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://link.springer.com/article/10.1186/s40309-021-00171-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s40309-021-00171-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>O'Cathain</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Croot</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Duncan</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Rousseau</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Sworn</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Turner</surname>
              <given-names>KM</given-names>
            </name>
            <name name-style="western">
              <surname>Yardley</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Hoddinott</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Guidance on how to develop complex interventions to improve health and healthcare</article-title>
          <source>BMJ Open</source>
          <year>2019</year>
          <volume>9</volume>
          <issue>8</issue>
          <fpage>e029954</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmjopen.bmj.com/lookup/pmidlookup?view=long&#38;pmid=31420394"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmjopen-2019-029954</pub-id>
          <pub-id pub-id-type="medline">31420394</pub-id>
          <pub-id pub-id-type="pii">bmjopen-2019-029954</pub-id>
          <pub-id pub-id-type="pmcid">PMC6701588</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rudan</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Gibson</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Ameratunga</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Arifeen</surname>
              <given-names>SE</given-names>
            </name>
            <name name-style="western">
              <surname>Bhutta</surname>
              <given-names>ZA</given-names>
            </name>
            <name name-style="western">
              <surname>Black</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Black</surname>
              <given-names>RE</given-names>
            </name>
            <name name-style="western">
              <surname>Brown</surname>
              <given-names>KH</given-names>
            </name>
            <name name-style="western">
              <surname>Campbell</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Carneiro</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Chan</surname>
              <given-names>KY</given-names>
            </name>
            <name name-style="western">
              <surname>Chandramohan</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Chopra</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cousens</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Darmstadt</surname>
              <given-names>GL</given-names>
            </name>
            <name name-style="western">
              <surname>Gardner</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Hess</surname>
              <given-names>SY</given-names>
            </name>
            <name name-style="western">
              <surname>Hyder</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Kapiriri</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Kosek</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lanata</surname>
              <given-names>CF</given-names>
            </name>
            <name name-style="western">
              <surname>Lansang</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Lawn</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tomlinson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tsai</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Webster</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Setting priorities in global child health research investments: guidelines for implementation of CHNRI method</article-title>
          <source>Croat Med J</source>
          <year>2008</year>
          <volume>49</volume>
          <issue>6</issue>
          <fpage>720</fpage>
          <lpage>733</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/19090596"/>
          </comment>
          <pub-id pub-id-type="doi">10.3325/cmj.2008.49.720</pub-id>
          <pub-id pub-id-type="medline">19090596</pub-id>
          <pub-id pub-id-type="pmcid">PMC2621022</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hjälmhult</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Glavin</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Okland</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Tveiten</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Parental groups during the child's first year: an interview study of parents' experiences</article-title>
          <source>J Clin Nurs</source>
          <year>2014</year>
          <volume>23</volume>
          <issue>19-20</issue>
          <fpage>2980</fpage>
          <lpage>2989</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://onlinelibrary.wiley.com/doi/10.1111/jocn.12528"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/jocn.12528</pub-id>
          <pub-id pub-id-type="medline">24393530</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Greene</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hogan</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <source>Researching Children's Experience: Approaches and Methods</source>
          <year>2011</year>
          <publisher-loc>London</publisher-loc>
          <publisher-name>SAGE Publications Ltd</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zwaanswijk</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>van Dulmen</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Advantages of asynchronous online focus groups and face-to-face focus groups as perceived by child, adolescent and adult participants: a survey study</article-title>
          <source>BMC Res Notes</source>
          <year>2014</year>
          <volume>7</volume>
          <fpage>756</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcresnotes.biomedcentral.com/articles/10.1186/1756-0500-7-756"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1756-0500-7-756</pub-id>
          <pub-id pub-id-type="medline">25341440</pub-id>
          <pub-id pub-id-type="pii">1756-0500-7-756</pub-id>
          <pub-id pub-id-type="pmcid">PMC4213506</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Adler</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Salanterä</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zumstein-Shaha</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Focus group interviews in child, youth, and parent research: an integrative literature review</article-title>
          <source>Int J Qual Methods</source>
          <year>2019</year>
          <volume>18</volume>
          <fpage>1609406919887274</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://journals.sagepub.com/doi/10.1177/1609406919887274"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/1609406919887274</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Preston</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Nafria</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Ohmer</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gaillard</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Dicks</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>West</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Turner</surname>
              <given-names>MA</given-names>
            </name>
          </person-group>
          <article-title>Developing a more tailored approach to patient and public involvement with children and families in pediatric clinical research: lessons learned</article-title>
          <source>Ther Innov Regul Sci</source>
          <year>2022</year>
          <volume>56</volume>
          <issue>6</issue>
          <fpage>948</fpage>
          <lpage>963</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35182389"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s43441-022-00382-4</pub-id>
          <pub-id pub-id-type="medline">35182389</pub-id>
          <pub-id pub-id-type="pii">10.1007/s43441-022-00382-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC8857393</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tangherlini</surname>
              <given-names>TR</given-names>
            </name>
            <name name-style="western">
              <surname>Roychowdhury</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Glenn</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Crespi</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Bandari</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Wadia</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Falahi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ebrahimzadeh</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Bastani</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>"Mommy Blogs" and the vaccination exemption narrative: results from a machine-learning approach for story aggregation on parenting social media sites</article-title>
          <source>JMIR Public Health Surveill</source>
          <year>2016</year>
          <volume>2</volume>
          <issue>2</issue>
          <fpage>e166</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://publichealth.jmir.org/2016/2/e166/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/publichealth.6586</pub-id>
          <pub-id pub-id-type="medline">27876690</pub-id>
          <pub-id pub-id-type="pii">v2i2e166</pub-id>
          <pub-id pub-id-type="pmcid">PMC5141339</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Teague</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Shatte</surname>
              <given-names>AB</given-names>
            </name>
          </person-group>
          <article-title>Exploring the transition to fatherhood: feasibility study using social media and machine learning</article-title>
          <source>JMIR Pediatr Parent</source>
          <year>2018</year>
          <volume>1</volume>
          <issue>2</issue>
          <fpage>e12371</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://pediatrics.jmir.org/2018/2/e12371/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/12371</pub-id>
          <pub-id pub-id-type="medline">31518298</pub-id>
          <pub-id pub-id-type="pii">v1i2e12371</pub-id>
          <pub-id pub-id-type="pmcid">PMC6715057</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shoults</surname>
              <given-names>CC</given-names>
            </name>
            <name name-style="western">
              <surname>Rutherford</surname>
              <given-names>MW</given-names>
            </name>
            <name name-style="western">
              <surname>Kemp</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Addicott</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Brown</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Greene</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Hayes</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Gan</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Larson-Prior</surname>
              <given-names>LJ</given-names>
            </name>
            <name name-style="western">
              <surname>Bona</surname>
              <given-names>JP</given-names>
            </name>
          </person-group>
          <article-title>Analysis of caregiver burden expressed in social media discussions</article-title>
          <source>Int J Environ Res Public Health</source>
          <year>2023</year>
          <volume>20</volume>
          <issue>3</issue>
          <fpage>1933</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=ijerph20031933"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/ijerph20031933</pub-id>
          <pub-id pub-id-type="medline">36767297</pub-id>
          <pub-id pub-id-type="pii">ijerph20031933</pub-id>
          <pub-id pub-id-type="pmcid">PMC9915402</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>JY</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>OD</given-names>
            </name>
            <name name-style="western">
              <surname>Ammari</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Using social media Reddit data to examine foster families' concerns and needs during COVID-19</article-title>
          <source>Child Abuse Negl</source>
          <year>2021</year>
          <volume>121</volume>
          <fpage>105262</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34411874"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.chiabu.2021.105262</pub-id>
          <pub-id pub-id-type="medline">34411874</pub-id>
          <pub-id pub-id-type="pii">S0145-2134(21)00335-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC8440933</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pedersen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lupton</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>‘What are you feeling right now?’ communities of maternal feeling on Mumsnet</article-title>
          <source>Emot Space Soc</source>
          <year>2018</year>
          <volume>26</volume>
          <fpage>57</fpage>
          <lpage>63</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.sciencedirect.com/science/article/abs/pii/S175545861630010X?via%3Dihub"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.emospa.2016.05.001</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pedersen</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>The good, the bad and the 'good enough' mother on the UK parenting forum Mumsnet</article-title>
          <source>Womens Stud Int Forum</source>
          <year>2016</year>
          <volume>59</volume>
          <fpage>32</fpage>
          <lpage>38</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.sciencedirect.com/science/article/abs/pii/S027753951530159X?via%3Dihub"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.wsif.2016.09.004</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Giles</surname>
              <given-names>DC</given-names>
            </name>
          </person-group>
          <article-title>Observing real-world groups in the virtual field: the analysis of online discussion</article-title>
          <source>Br J Soc Psychol</source>
          <year>2016</year>
          <volume>55</volume>
          <issue>3</issue>
          <fpage>484</fpage>
          <lpage>498</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bpspsychub.onlinelibrary.wiley.com/doi/10.1111/bjso.12139"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/bjso.12139</pub-id>
          <pub-id pub-id-type="medline">26916617</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Botelle</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Willott</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Birth, attitudes and placentophagy: a thematic discourse analysis of discussions on UK parenting forums</article-title>
          <source>BMC Pregnancy Childbirth</source>
          <year>2020</year>
          <volume>20</volume>
          <issue>1</issue>
          <fpage>134</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcpregnancychildbirth.biomedcentral.com/articles/10.1186/s12884-020-2824-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12884-020-2824-3</pub-id>
          <pub-id pub-id-type="medline">32138706</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12884-020-2824-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC7059278</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Croucher</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Mertan</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Shafran</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Bennett</surname>
              <given-names>SD</given-names>
            </name>
          </person-group>
          <article-title>The use of mumsnet by parents of young people with mental health needs: qualitative investigation</article-title>
          <source>JMIR Ment Health</source>
          <year>2020</year>
          <volume>7</volume>
          <issue>9</issue>
          <fpage>e18271</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mental.jmir.org/2020/9/e18271/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/18271</pub-id>
          <pub-id pub-id-type="medline">32880583</pub-id>
          <pub-id pub-id-type="pii">v7i9e18271</pub-id>
          <pub-id pub-id-type="pmcid">PMC7499161</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Medvedev</surname>
              <given-names>AN</given-names>
            </name>
            <name name-style="western">
              <surname>Lambiotte</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Delvenne</surname>
              <given-names>JC</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Ghanbarnejad</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Roy</surname>
              <given-names>RS</given-names>
            </name>
            <name name-style="western">
              <surname>Karimi</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Delvenne</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Mitra</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>The anatomy of Reddit: an overview of academic research</article-title>
          <source>Dynamics on and of Complex Networks III: Machine Learning and Statistical Physics Approaches</source>
          <year>2019</year>
          <publisher-loc>Cham</publisher-loc>
          <publisher-name>Springer International Publishing</publisher-name>
          <fpage>183</fpage>
          <lpage>204</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Proferes</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Gilbert</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Fiesler</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zimmer</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Studying Reddit: a systematic overview of disciplines, approaches, methods, and ethics</article-title>
          <source>Soc Media Soc</source>
          <year>2021</year>
          <volume>7</volume>
          <issue>2</issue>
          <fpage>205630512110190</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://journals.sagepub.com/doi/10.1177/20563051211019004"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/20563051211019004</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Westrupp</surname>
              <given-names>EM</given-names>
            </name>
            <name name-style="western">
              <surname>Greenwood</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Fuller-Tyszkiewicz</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Berkowitz</surname>
              <given-names>TS</given-names>
            </name>
            <name name-style="western">
              <surname>Hagg</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Youssef</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Text mining of Reddit posts: using latent Dirichlet allocation to identify common parenting issues</article-title>
          <source>PLoS One</source>
          <year>2022</year>
          <volume>17</volume>
          <issue>2</issue>
          <fpage>e0262529</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0262529"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0262529</pub-id>
          <pub-id pub-id-type="medline">35108299</pub-id>
          <pub-id pub-id-type="pii">PONE-D-21-07563</pub-id>
          <pub-id pub-id-type="pmcid">PMC8809584</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Baumgartner</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zannettou</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Keegan</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Squire</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Blackburn</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>The Pushshift Reddit dataset</article-title>
          <year>2020</year>
          <conf-name>The Fourteenth International AAAI Conference on Web and Social Media (ICWSM-20)</conf-name>
          <conf-date>Atlanta, GA, USA</conf-date>
          <conf-loc>June 8-11, 2019</conf-loc>
          <fpage>830</fpage>
          <lpage>839</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ojs.aaai.org/index.php/ICWSM/article/view/7347"/>
          </comment>
          <pub-id pub-id-type="doi">10.1609/icwsm.v14i1.7347</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Thornton</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>haeste/SocialMediaScanning: For JMIR publication</article-title>
          <source>Zenodo</source>
          <access-date>2023-11-02</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://zenodo.org/records/8356362">https://zenodo.org/records/8356362</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bird</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Loper</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Klein</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <source>Natural Language Processing with Python</source>
          <year>2009</year>
          <publisher-loc>Sebastopol, CA</publisher-loc>
          <publisher-name>O'Reilly Media Inc</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rehurek</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Sojka</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <source>Gensim–Python framework for vector space modelling</source>
          <year>2011</year>
          <publisher-loc>Brno</publisher-loc>
          <publisher-name>Masaryk University</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Blei</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Ng</surname>
              <given-names>AY</given-names>
            </name>
            <name name-style="western">
              <surname>Jordan</surname>
              <given-names>MI</given-names>
            </name>
          </person-group>
          <article-title>Latent Dirichlet allocation</article-title>
          <source>J Mach Learn Res</source>
          <year>2003</year>
          <volume>3</volume>
          <fpage>1022</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmlr.org/papers/volume3/blei03a/blei03a.pdf?ref=https://githubhelp.com"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hoffman</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Blei</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Bach</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Online learning for latent Dirichlet allocation</article-title>
          <source>Advances in Neural Information Processing Systems 23</source>
          <year>2010</year>
          <conf-name>24th Annual Conference on Neural Information Processing Systems 2010</conf-name>
          <conf-date>December 6-11, 2010</conf-date>
          <conf-loc>Hyatt Regency, Vancouver, Canada</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Röder</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Both</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hinneburg</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Exploring the space of topic coherence measures</article-title>
          <year>2015</year>
          <conf-name>WSDM 2015: Eighth ACM International Conference on Web Search and Data Mining</conf-name>
          <conf-date>February 2-6, 2015</conf-date>
          <conf-loc>Shanghai, China</conf-loc>
          <fpage>399</fpage>
          <lpage>408</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/10.1145/2684822.2685324"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/2684822.2685324</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lavigne</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Birken</surname>
              <given-names>CS</given-names>
            </name>
            <name name-style="western">
              <surname>Maguire</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Straus</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Laupacis</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Priority setting in paediatric preventive care research</article-title>
          <source>Arch Dis Child</source>
          <year>2017</year>
          <volume>102</volume>
          <issue>8</issue>
          <fpage>748</fpage>
          <lpage>753</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://adc.bmj.com/content/102/8/748"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/archdischild-2016-312284</pub-id>
          <pub-id pub-id-type="medline">28404552</pub-id>
          <pub-id pub-id-type="pii">archdischild-2016-312284</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sievert</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Shirley</surname>
              <given-names>KE</given-names>
            </name>
          </person-group>
          <article-title>LDAvis: a method for visualizing and interpreting topics</article-title>
          <year>2015</year>
          <conf-name>Proceedings of the Workshop on Interactive Language Learning, Visualization, and Interfaces</conf-name>
          <conf-date>June 27, 2014</conf-date>
          <conf-loc>Baltimore, MA, USA</conf-loc>
          <fpage>63</fpage>
          <lpage>70</lpage>
          <pub-id pub-id-type="doi">10.3115/v1/w14-3110</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hoyle</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Goel</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Peskov</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Hian-Cheong</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Boyd-Graber</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Resnik</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Is automated topic model evaluation broken?: The incoherence of coherence</article-title>
          <year>2021</year>
          <conf-name>35th Conference on Neural Information Processing Systems (NeurIPS 2021)</conf-name>
          <conf-date>December 6-14, 2021</conf-date>
          <conf-loc>Online</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>O’Callaghan</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Greene</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Carthy</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Cunningham</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>An analysis of the coherence of descriptors in topic modeling</article-title>
          <source>Expert Syst Appl</source>
          <year>2015</year>
          <volume>42</volume>
          <issue>13</issue>
          <fpage>5645</fpage>
          <lpage>5657</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/10/e22635/"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.eswa.2015.02.055</pub-id>
          <pub-id pub-id-type="pii">v22i10e22635</pub-id>
          <pub-id pub-id-type="pmcid">PMC7575341</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Low</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Rumker</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Talkar</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Torous</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Cecchi</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Ghosh</surname>
              <given-names>SS</given-names>
            </name>
          </person-group>
          <article-title>Natural language processing reveals vulnerable mental health support groups and heightened health anxiety on Reddit during COVID-19: observational study</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <volume>22</volume>
          <issue>10</issue>
          <fpage>e22635</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/10/e22635/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/22635</pub-id>
          <pub-id pub-id-type="medline">32936777</pub-id>
          <pub-id pub-id-type="pii">v22i10e22635</pub-id>
          <pub-id pub-id-type="pmcid">PMC7575341</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Okon</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Rachakonda</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>HJ</given-names>
            </name>
            <name name-style="western">
              <surname>Callison-Burch</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lipoff</surname>
              <given-names>JB</given-names>
            </name>
          </person-group>
          <article-title>Natural language processing of Reddit data to evaluate dermatology patient experiences and therapeutics</article-title>
          <source>J Am Acad Dermatol</source>
          <year>2020</year>
          <volume>83</volume>
          <issue>3</issue>
          <fpage>803</fpage>
          <lpage>808</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jaad.2019.07.014</pub-id>
          <pub-id pub-id-type="medline">31306722</pub-id>
          <pub-id pub-id-type="pii">S0190-9622(19)32371-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Markides</surname>
              <given-names>BR</given-names>
            </name>
            <name name-style="western">
              <surname>Laws</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Hesketh</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Maddison</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Denney-Wilson</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Campbell</surname>
              <given-names>KJ</given-names>
            </name>
          </person-group>
          <article-title>A thematic cluster analysis of parents' online discussions about fussy eating</article-title>
          <source>Matern Child Nutr</source>
          <year>2022</year>
          <volume>18</volume>
          <issue>2</issue>
          <fpage>e13316</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35132813"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/mcn.13316</pub-id>
          <pub-id pub-id-type="medline">35132813</pub-id>
          <pub-id pub-id-type="pmcid">PMC8932712</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mellon</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Prosser</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Twitter and Facebook are not representative of the general population: political attitudes and demographics of British social media users</article-title>
          <source>Res Politics</source>
          <year>2017</year>
          <volume>4</volume>
          <issue>3</issue>
          <fpage>205316801772000</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://journals.sagepub.com/doi/full/10.1177/2053168017720008"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/2053168017720008</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Odgers</surname>
              <given-names>HL</given-names>
            </name>
            <name name-style="western">
              <surname>Tong</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lopez-Vargas</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Davidson</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Jaffe</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>McKenzie</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Pinkerton</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Wake</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Richmond</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Crowe</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Caldwell</surname>
              <given-names>PHY</given-names>
            </name>
            <name name-style="western">
              <surname>Hill</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Couper</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Haddad</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kassai</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Craig</surname>
              <given-names>JC</given-names>
            </name>
          </person-group>
          <article-title>Research priority setting in childhood chronic disease: a systematic review</article-title>
          <source>Arch Dis Child</source>
          <year>2018</year>
          <volume>103</volume>
          <issue>10</issue>
          <fpage>942</fpage>
          <lpage>951</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://adc.bmj.com/content/103/10/942"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/archdischild-2017-314631</pub-id>
          <pub-id pub-id-type="medline">29643102</pub-id>
          <pub-id pub-id-type="pii">archdischild-2017-314631</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cawthorpe</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Wilkes</surname>
              <given-names>TCR</given-names>
            </name>
            <name name-style="western">
              <surname>Rahman</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>DH</given-names>
            </name>
            <name name-style="western">
              <surname>Conner-Spady</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>McGurran</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Noseworthy</surname>
              <given-names>TW</given-names>
            </name>
          </person-group>
          <article-title>Priority-setting for children's mental health: clinical usefulness and validity of the priority criteria score</article-title>
          <source>J Can Acad Child Adolesc Psychiatry</source>
          <year>2007</year>
          <volume>16</volume>
          <issue>1</issue>
          <fpage>18</fpage>
          <lpage>26</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/18392175"/>
          </comment>
          <pub-id pub-id-type="medline">18392175</pub-id>
          <pub-id pub-id-type="pmcid">PMC2276170</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sutter</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Pham</surname>
              <given-names>GV</given-names>
            </name>
            <name name-style="western">
              <surname>Yun</surname>
              <given-names>JT</given-names>
            </name>
            <name name-style="western">
              <surname>Narang</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Sundaram</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Fiese</surname>
              <given-names>BH</given-names>
            </name>
          </person-group>
          <article-title>Food parenting topics in social media posts: development of a coding system, examination of frequency of food parenting concepts, and comparison across Reddit and Facebook</article-title>
          <source>Appetite</source>
          <year>2021</year>
          <volume>161</volume>
          <fpage>105137</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.sciencedirect.com/science/article/abs/pii/S0195666321000453?via%3Dihub"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.appet.2021.105137</pub-id>
          <pub-id pub-id-type="medline">33493607</pub-id>
          <pub-id pub-id-type="pii">S0195-6663(21)00045-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Park</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>June</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Analysis of parenting informational needs for mothers with infants and toddlers using text-mining</article-title>
          <source>Child Youth Serv Rev</source>
          <year>2023</year>
          <volume>145</volume>
          <fpage>106768</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.sciencedirect.com/science/article/abs/pii/S0190740922004042?via%3Dihub"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.childyouth.2022.106768</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
