<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id><journal-id journal-id-type="publisher-id">jmir</journal-id><journal-id journal-id-type="index">1</journal-id><journal-title>Journal of Medical Internet Research</journal-title><abbrev-journal-title>J Med Internet Res</abbrev-journal-title><issn pub-type="epub">1438-8871</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v28i1e88519</article-id><article-id pub-id-type="doi">10.2196/88519</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Engagement Trends in Online Vaccine Content: Longitudinal YouTube Study</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Tizzani</surname><given-names>Michele</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Mejova</surname><given-names>Yelena</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib></contrib-group><aff id="aff1"><institution>Section for Cognitive Systems, Department of Applied Mathematics and Computer Science, Technical University of Denmark</institution><addr-line>Richard Petersens Plads</addr-line><addr-line>Kgs. Lyngby</addr-line><addr-line>Capital Region</addr-line><country>Denmark</country></aff><aff id="aff2"><institution>Institute for Scientific Interchange</institution><addr-line>Turin</addr-line><addr-line>Piedmont</addr-line><country>Italy</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Mavragani</surname><given-names>Amaryllis</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Hussain</surname><given-names>Waqas Ghulam</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Fan</surname><given-names>Yifan</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Zaidi</surname><given-names>Zainab</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Liu</surname><given-names>Zhao</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Kmetty</surname><given-names>Zoltan</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Michele Tizzani, PhD, Section for Cognitive Systems, Department of Applied Mathematics and Computer Science, Technical University of Denmark, Richard Petersens Plads, Kgs. Lyngby, Capital Region, 2800, Denmark, 45 45 25 30 31; <email>micti@dtu.dk</email></corresp></author-notes><pub-date pub-type="collection"><year>2026</year></pub-date><pub-date pub-type="epub"><day>19</day><month>6</month><year>2026</year></pub-date><volume>28</volume><elocation-id>e88519</elocation-id><history><date date-type="received"><day>26</day><month>11</month><year>2025</year></date><date date-type="rev-recd"><day>20</day><month>04</month><year>2026</year></date><date date-type="accepted"><day>30</day><month>04</month><year>2026</year></date></history><copyright-statement>&#x00A9; Michele Tizzani, Yelena Mejova. Originally published in the Journal of Medical Internet Research (<ext-link ext-link-type="uri" xlink:href="https://www.jmir.org">https://www.jmir.org</ext-link>), 19.6.2026. </copyright-statement><copyright-year>2026</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research (ISSN 1438-8871), is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://www.jmir.org/">https://www.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://www.jmir.org/2026/1/e88519"/><abstract><sec><title>Background</title><p>YouTube is the primary global video platform, hosting both authoritative health information and vaccine-skeptic viewpoints. However, engagement dynamics remain poorly understood.</p></sec><sec><title>Objective</title><p>The aim of this study was to investigate the temporal and textual dynamics of engagement of the YouTube viewership with vaccination content, and specifically content that is in favor of or against vaccination. We contextualized these dynamics in the authority signals of the posting channel and the moderation actions taken by the platform.</p></sec><sec sec-type="methods"><title>Methods</title><p>We conducted a 6-month daily longitudinal analysis of 7213 vaccine-related YouTube videos (November 2024 to May 2025) mentioning vaccination. We used zero-shot large language model classification with manual verification to classify the video stance toward vaccination, and the stance of their comments toward the video. The engagement and disagreement dynamics were modeled using Bayesian regression.</p></sec><sec sec-type="results"><title>Results</title><p>Our findings show engagement asymmetry between content supporting and questioning vaccination. Vaccine-hesitant videos in our sample receive substantially higher raw engagement (median likes: 40 [IQR 3-846] to 59 [IQR 3-1319]; median comments: 10 [IQR 0-160] to 18 [IQR 0-311] per video versus 3 [IQR 1-15] and 0 [IQR 0-4], respectively, for strongly provaccine content) and moderate normalized engagement rates (true median combined rate: 0.073 [IQR 0.028-0.121] to 0.069 [IQR 0.027-0.118] interactions per view versus 0.026 [IQR 0.007-0.060] for strongly pro-vaccine videos, a 2.5-2.6&#x00D7; difference). Descriptively, vaccine-hesitant videos reach 90% of cumulative views faster (18 [IQR 8-38] days vs 32 [IQR 18-64] days; 44% faster), while negative binomial models that adjust for total engagement volume indicate that approximately 20% of this advantage reflects genuine temporal compression independent of engagement volume. Comment analysis indicated that the vaccine-hesitant videos in our sample foster echo chambers, while the provaccine content attracts battlegrounds. Considering the sources of vaccine-related content, provaccine content tends to originate from organizations, particularly news and health institutions, while vaccine-hesitant discourse is more likely to come from individual creators, even those self-identifying as medical doctors. Moderation, on the rare occasion when it occurs (about 2% of the videos were taken down), comes after engagement saturation, limiting its effectiveness.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>Our analysis suggests that the vaccine-hesitant content can dominate YouTube&#x2019;s engagement ecosystem through rapid early-stage amplification, which has direct implications for public health intervention timing and platform governance policy.</p></sec></abstract><kwd-group><kwd>vaccine hesitancy</kwd><kwd>YouTube</kwd><kwd>engagement dynamics</kwd><kwd>longitudinal analysis</kwd><kwd>Bayesian modeling</kwd><kwd>echo chambers</kwd><kwd>misinformation</kwd><kwd>social media</kwd><kwd>temporal patterns</kwd><kwd>public health policy</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Despite saving millions of lives [<xref ref-type="bibr" rid="ref1">1</xref>], vaccination has been a contentious public health issue, with hesitancy increasing globally since the COVID-19 outbreak [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref3">3</xref>]. In 2025, the debate around vaccination became embedded in government policy and electoral politics (especially in the United States) following the strong politicization of the topic during the pandemic [<xref ref-type="bibr" rid="ref4">4</xref>]. While the acute phase of the pandemic has passed and the vaccination debate has been settled in the scientific community, the battle for public opinion is still underway, and it could reshape the long-standing public health policies. The discourse on vaccination is actively shaping the government&#x2019;s decisions, and in the United States, political movements are gaining traction, promising to &#x201C;Make America Healthy Again&#x201D; and framing vaccination as a political stance. Already, the United States is re-evaluating its role as a supporter of vaccine-based medicine both worldwide and domestically. The consequences are in evidence: the largest measles outbreak&#x2014;since its elimination status was achieved in 2000&#x2014;has reached 1431 cases and 3 deaths by September 2025 [<xref ref-type="bibr" rid="ref5">5</xref>].</p><p>This shifting policy landscape underscores the urgency of understanding online vaccine discourse. Social media platforms have become central battlegrounds in shaping public opinion, serving as both powerful tools for health communication and vectors for misinformation that can undermine public trust in vaccines [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>]. Among these platforms, YouTube is a primary source of information for a global audience, making the quality and reception of its health content a matter of critical public concern. In 2025, the Pew Research Center found that the vast majority of US adults (84%) say they have ever used YouTube, and about half of them go on YouTube daily, and that it is the most widely used online platform among US teens [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref9">9</xref>].</p><p>Prior research has established that YouTube hosts a mix of credible and misleading vaccine-related content, but none do so longitudinally. Earlier, Basch et al [<xref ref-type="bibr" rid="ref10">10</xref>] examined the 87 most widely viewed videos around vaccination safety and their creators, finding that 65.5% discouraged the use of vaccines. Then, in 2021, Tang et al [<xref ref-type="bibr" rid="ref11">11</xref>] created recommendation networks of pro- and antivaccine videos and found that when the user begins their session by searching provaccine keywords, they are recommended more videos by governmental agencies, hospitals, and academic institutions than when users search for antivaccine keywords. More recently, Ng et al [<xref ref-type="bibr" rid="ref12">12</xref>] &#x201C;gamified&#x201D; this analysis by asking real-world participants to intentionally find an antivaccine video when starting from the World Health Organization&#x2019;s posts, finding that less than 6% of the videos recommended by the algorithm were antivaccine. A most recent dataset&#x2014;albeit focusing on COVID-19&#x2014;was created by Jung et al [<xref ref-type="bibr" rid="ref13">13</xref>] using sock-puppets. They found that 31.5% of the top 10 search results contained COVID-19 misinformation, including that about vaccination. As exemplified above, not only do the studies in the existing literature use heterogeneous research designs, (intentionally) biased queries, and crawling starting points, they are, above all, limited by their <italic>cross-sectional</italic> nature (also including manually annotated surveys such as [<xref ref-type="bibr" rid="ref14">14</xref>]). They suggest that antivaccination content indeed exists on YouTube but fail to provide the full scope of posted vaccine-related content, and to capture the temporal dynamics of the actual users&#x2019; interaction with it.</p><p>Nonetheless, within this methodologically disparate landscape, we find a troubling trend: misleading or vaccine-hesitant videos often attract significantly more engagement&#x2014;in views, likes, and comments&#x2014;than accurate, provaccine videos [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref11">11</xref>]. This &#x201C;engagement asymmetry&#x201D; aligns with broader findings that false news spreads faster and further than true news in online environments [<xref ref-type="bibr" rid="ref15">15</xref>]. Although YouTube has a medical misinformation policy [<xref ref-type="bibr" rid="ref16">16</xref>] that advises users not to post information that &#x201C;contradicts health authority guidance&#x201D; on the prevention and treatment of diseases, the stricter COVID-19 era policies have been phased out in 2023 [<xref ref-type="bibr" rid="ref17">17</xref>]. This leaves critical policy-relevant questions unanswered: How quickly does vaccine-hesitant content capture audience attention compared to provaccine content? And what is the nature of the discourse these different types of content foster?</p><p>Controversy around vaccination has been shown to be reflected on social media, such as Facebook and Twitter [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>]. Further, Gruzd et al [<xref ref-type="bibr" rid="ref20">20</xref>] documented Facebook-to-YouTube pathways that contributed to the spread of antivaccination content and formed clusters of densely connected videos. These areas of discourse, wherein information favors a certain stance while other views are excluded, are indicative of echo chambers [<xref ref-type="bibr" rid="ref21">21</xref>]. Note that the stance may be in favor or in opposition to some topic, such as vaccination, making possible echo chambers containing the majority opinion that disagrees with the medically established vaccination advice. Unfortunately, Gruzd et al [<xref ref-type="bibr" rid="ref20">20</xref>] did not capture possible disagreements within the comment-level discourse. On the other hand, Ekram et al [<xref ref-type="bibr" rid="ref22">22</xref>] found that comments on YouTube videos around the human papillomavirus vaccine often mentioned its potential side effects and conspiracy theories. Such spaces, wherein different or opposing points of view are discussed actively, can be viewed as a battleground or a controversy [<xref ref-type="bibr" rid="ref23">23</xref>]. Unfortunately, Ekram et al [<xref ref-type="bibr" rid="ref22">22</xref>] did not track the engagement temporally. In this work, we aim to combine quantitative, temporal, and qualitative text engagement signals to discover whether echo chambers or battlegrounds better characterize the vaccination debate on YouTube.</p><p>This dynamism is further complicated by the variety of actors posting health-related information on social media. Although public health institutions and researchers have joined the conversation, online influencers hold dominance by amassing vastly larger followings [<xref ref-type="bibr" rid="ref24">24</xref>]. Such competition for attention is especially acute during emergencies, exemplified by the beginning of the COVID-19 pandemic, when political and commercial interests competed with the public health messaging [<xref ref-type="bibr" rid="ref25">25</xref>]. The connection between the use of social media and higher vaccine hesitancy during this period has shown a robust negative impact on the vaccination efforts [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref27">27</xref>], which cost an estimated thousands of lives [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>]. Given the high stakes, it is important to further understand the engagement dynamics around organizational accounts, in comparison to those of individuals who possibly have no medical credentials.</p><p>This study contributes a <italic>unique systematic daily longitudinal analysis</italic> of vaccine-related YouTube videos over a 6-month period. By tracking thousands of videos from the day of their upload through their engagement maturation, we provide a fine-grained temporal account of the online vaccine discourse. Unlike previous studies, which may confound engagement patterns with post hoc algorithmic amplification or viral surprises, this study focuses on the earliest phase of a video&#x2019;s lifecycle&#x2014;the initial engagement that occurs within the first few days and weeks of upload, when creators&#x2019; original reach and audience composition have the most direct influence. Our multifaceted approach combines scalable, large language model (LLM)&#x2013;based classification of video stances and comment agreement with Bayesian statistical modeling to answer three key questions:</p><list list-type="order"><list-item><p><italic>Temporal dynamics</italic>: How do the engagement trajectories of pro- and vaccine-hesitant videos differ over time?</p></list-item><list-item><p><italic>Discourse characterization</italic>: Do these different types of videos cultivate confirmatory &#x201C;echo chambers&#x201D; or contentious &#x201C;battlegrounds&#x201D; in their comment sections?</p></list-item><list-item><p><italic>Source effects</italic>: How do channel characteristics, such as topic and authority, moderate these discourse patterns?</p></list-item></list><p>We provide quantitative evidence that vaccine-hesitant content not only receives 10-fold higher raw engagement volume (and 3.1-fold higher per-view engagement rates) but also reaches its engagement peak faster than provaccine content (44% descriptively; 20% after controlling for engagement volume). Furthermore, through comment-level analysis, we demonstrate that this engagement follows distinct patterns: vaccine-hesitant videos foster agreeable echo chambers, while provaccine videos become contentious battlegrounds characterized by high levels of disagreement. These findings have significant implications for public health policy, platform governance, and science communication, highlighting the narrow window for effective intervention and the urgent need for context-aware communication strategies in an era of heightened vaccine policy contention.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Data Collection</title><p>The collection used in this study was created using a double-phase approach outlined in <xref ref-type="fig" rid="figure1">Figure 1</xref>. We adopt a &#x201C;streaming&#x201D; approach, wherein every day the collector takes 2 actions: it first uses a list of relevant keywords to search for videos published in the previous day and selects the videos that pass several filters for inclusion in the dataset, and then it periodically recollects the metadata about the selected videos.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Data collection pipeline overview: the daily collection and video selection (top) and periodic collection (bottom).</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v28i1e88519_fig01.png"/></fig><p>Specifically, we use the YouTube Search application programming interface (API) [<xref ref-type="bibr" rid="ref30">30</xref>] to query for videos matching the following keyword list: <italic>vaccine</italic>, <italic>vaccination</italic>, <italic>novax</italic>, <italic>provax</italic>, <italic>antivaxx</italic>, <italic>antivaxxer</italic> (guided by previous work [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref32">32</xref>]). We restrict the time of collection to the previous day, the location to the &#x201C;US,&#x201D; and the language to English. The results are sorted by relevance, and we save the top 500. Next, we use the YouTube Video API [<xref ref-type="bibr" rid="ref33">33</xref>] to collect the metadata about the posted videos (note that it would be at most 1 day old), and the YouTube Transcript API library [<xref ref-type="bibr" rid="ref34">34</xref>] to download their transcripts. These videos are then filtered through several selection steps to make sure they contain enough content for analysis and that they are relevant to the topic of vaccination. We require that the videos have a transcript, be at least 1 minute and at most 60 minutes in duration, and that at least 1 keyword from the query can be found in their title or transcript, or at least 3 keywords can be found in the transcript, if none exist in the title. This filter results in about 8.3% (7213/86,387) of the videos passing (mostly because so many videos are very short, the analysis of which we leave for future studies).</p><p>During the periodic phase of the collection, we requery the metadata information about the videos daily in order to compose a temporal picture of the audience&#x2019;s engagement with them, as well as to capture any potential moderation actions taken by the platform. We perform this requerying every day for the first week after the video is initially retrieved, and following that, every week. After 3 months of collection, we consider whether in the past 2 time segments the counts of views, likes, or comments increase, and if they do not, we conclude the collection for those videos. During this collection, we also gather the 1000 most recent comments posted on that video using the comment Threads API, as well as the information about the poster of the video using the Channels API [<xref ref-type="bibr" rid="ref35">35</xref>]. The final dataset spans 6 months (November 20, 2024, to May 20, 2025) and is composed of 7213 videos posted by 3872 unique channels, and their accompanying 911,219 comments. Of the 7213 videos initially collected, 302 were excluded due to missing channel-level metadata (eg, hidden subscriber counts) or engagement timestamps required for the regression models, resulting in a final analytical dataset of 6074 videos.</p></sec><sec id="s2-2"><title>Content Characterization</title><sec id="s2-2-1"><title>Videos</title><p>As the focus of this study is to monitor the extent to which vaccine-hesitant content is present in such data, we endeavor to classify the collected videos according to their stance on vaccination [<xref ref-type="bibr" rid="ref36">36</xref>]. We begin by extracting excerpts from the video transcripts, of length 100 words, centered around the query keywords, which we then label (if more than 20 are found in a transcript, we randomly select 20). We then use the zero-shot classification via GPT-4o mini (OpenAI) to assign one of the following labels to each of the excerpts: &#x201C;in favor of vaccination,&#x201D; &#x201C;against vaccination,&#x201D; or &#x201C;not in favor or against vaccination,&#x201D; using the prompt shown in Section A.1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. This resulted in 55,310 annotated excerpts, an average of 8 per video. We validated this approach by manually annotating a random sample of 200 text segments. The agreement between the two authors of this study, computed on 60 segments, was near-perfect, at 96.7% (58/60) (Cohen &#x03BA;=0.94), with 2 instances of disagreement between the &#x201C;in favor of vaccine&#x201D; and &#x201C;not in favor or against vaccination&#x201D; classes. The accuracy of the zero-shot classifier was estimated at 82.5% (165/200) (a marked improvement compared to 70% achieved by standard natural language processing tools evaluated in previous literature [<xref ref-type="bibr" rid="ref37">37</xref>]). Per-class performance statistics can be seen in Table S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. All of the errors were those with the middle label &#x201C;neither&#x201D; except for 4 instances where the disagreement was between the &#x201C;against vaccination&#x201D; and &#x201C;in favor of vaccination,&#x201D; suggesting that the main source of error may be due to the strength of the expressed stance. Next, we propagate these labels to the videos by considering the mean of the excerpt scores for each video, using the following encoding: &#x2212;1=against vaccination, 1=in favor of vaccination, and 0=neither in favor nor against. For the ease of interpretation and analysis, we categorize the continuous scores into the following: [0.5, 1]: &#x201C;strongly in favor&#x201D; (SIF); (0, 0.5): &#x201C;in favor&#x201D; (IF); [0]: &#x201C;neutral&#x201D; (N); (&#x2212;0.5, 0): &#x201C;against&#x201D; (A); and [&#x2212;1.0, &#x2212;0.5]: &#x201C;strongly against&#x201D; (SA) vaccines. This way, we were able to annotate 6074 videos posted by 3789 distinct users. The number of videos and channels in each category can be seen in the Results section.</p></sec><sec id="s2-2-2"><title>Comments</title><p>To characterize the discourse surrounding the videos, we annotate a sample of comments using a staged pipeline. We begin by filtering our video dataset to focus on the most engaged content, retaining only videos with at least 10 comments. From this filtered set, we randomly sample up to 50 comments per video for annotation. The sampled comments for each video are processed in a single batched API call to an LLM (GPT-4o mini). To determine the comment agreement with the video, the model is provided with the video&#x2019;s transcript and metadata as contextual reference (title, description, and transcript) and prompted to perform 2 analyses for each comment: first, to classify its agreement relative to the video&#x2019;s main claims (&#x201C;agree,&#x201D; &#x201C;disagree,&#x201D; or &#x201C;neutral/unrelated&#x201D;), and second, to determine its sentiment (&#x201C;positive,&#x201D; &#x201C;negative,&#x201D; or &#x201C;neutral&#x201D;). The model is also instructed to provide a brief rationale for each classification. The specific prompt used for this task is detailed in Section A.2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. Further, the agreement label was annotated by the authors on a sample of 100 comments. Interannotator agreement, computed on 20 overlapping items, was <italic>k</italic>=0.66, indicating substantial agreement [<xref ref-type="bibr" rid="ref38">38</xref>].</p><p>Comparing the labels to those produced by the classifier, 73 labels match exactly, 17 disagree with a &#x201C;neutral/unrelated&#x201D; label, and the remaining 10 have the opposite disagreement (&#x201C;agree&#x201D; vs &#x201C;disagree&#x201D;). Upon manual examination, we find that the classifier often either misinterprets the stance of a long transcript or misses a contextual connection between mentioned parties that is not explicitly mentioned in the text. As the accuracy of the classifier is 90% if the &#x201C;neutral&#x201D; label is not considered an error, we proceed with the analysis, while keeping in mind the tool&#x2019;s limitations.</p><p>By using this zero-shot classification approach, we are able to scale our analysis to thousands of videos without relying on rigid keyword lists that might miss nuance. Conceptually, this method mimics human judgment regarding video stance and comment sentiment but applies it consistently across the entire dataset. This allows us to map the landscape of vaccine discourse with high granularity, ensuring that our distinction between &#x201C;provaccine&#x201D; and &#x201C;vaccine-hesitant&#x201D; content captures the true intent of the speaker rather than just the presence of specific medical terms.</p></sec><sec id="s2-2-3"><title>Channel Characterization</title><p>To understand the source of the videos in our dataset, we characterize the channels using a two-stage process: (1) an automated, hierarchical classification of the video&#x2019;s primary topic for each of the 3789 channels in the dataset, and (2) a manual annotation of the channel&#x2019;s creator type and declared authority signals for a subset of 645 channels.</p><sec id="s2-2-3-1"><title>Hierarchical Topic Classification</title><p>A substantial proportion of channels (278/3789, 7.3%) have multiple topic assignments from YouTube&#x2019;s metadata, reflecting the inherent multidimensionality of vaccine discourse [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref6">6</xref>]. To resolve these ambiguities for categorical analysis, we implement a 2-level hierarchical classification approach grounded in established cascade methodology [<xref ref-type="bibr" rid="ref39">39</xref>]. First, following cascade principles [<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref41">41</xref>], we use vaccine-related keywords to identify the broad topic category for each video, acknowledging that vaccine discourse cuts across multiple subjects [<xref ref-type="bibr" rid="ref22">22</xref>]. Second, to resolve remaining multitopic conflicts, we apply a specificity prioritization rule: politics &#x227B; society &#x227B; health. This hierarchy is theoretically grounded in hypernym-hyponym relationships from taxonomy theory [<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref42">42</xref>], ensuring that more specific and discriminative categories (hyponyms like politics) are retained over broader ones (hypernyms like society or health). This ensures that more specific, discriminative categories are preserved over broader ones, collapsing ambiguous assignments into a single primary topic while retaining critical information about content framing [<xref ref-type="bibr" rid="ref39">39</xref>]. Details on the topic of co-occurrence statistics can be found in Table S2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p></sec><sec id="s2-2-3-2"><title>Manual Annotation</title><p>For the second approach, we consider two samples of users: in the first are the channels that posted more than 3 videos in our dataset (339 channels), and the second sample includes channels that posted videos altogether totaling more than 10,000 views (451 channels). Combined, the two lists contain 645 unique channel IDs. The focus of the annotation is 2-fold: finding whether the channel associates itself with an organization or an individual, and what kinds of authoritative signals the channel projects. Such signals may include being a doctor, a news agency, or presenting expertise in the topics of health, science, or education. We also mark the channels that provide opinions, without mentioning other qualifications, and those centered around entertainment outside educational or scientific discourse. The page of each channel was examined and annotated manually. Seven channels were removed by the platform before they could be evaluated. Four were removed from further channel-related analysis due to a topical match, such as being about animals and mentioning animal vaccination.</p><p>By using both topical signals from YouTube and those from manual annotation, we provide a view of the authors of these videos both in terms of the narrative view of their presentation of the topic and in terms of their self-presentation as a possible authority on the subject.</p></sec></sec></sec><sec id="s2-3"><title>Engagement Metrics</title><sec id="s2-3-1"><title>Video-Level Analysis</title><p>To examine engagement patterns at the video level, we aggregated all metadata and computed normalized engagement rates. For each video <italic>v</italic>, the like ratio (LR) and comment ratio (CR) were defined as:</p><p>LR<italic><sub>v</sub></italic> = (video likeCount<italic><sub>v</sub></italic>)/(video viewCount<italic><sub>v</sub></italic>+1)</p><p>CR<italic><sub>v</sub></italic> = (video commentCount<italic><sub>v</sub></italic>)/(video viewCount<italic><sub>v</sub></italic>+1)</p><p>with extreme values clipped to the interval [0.001, 0.999] to satisfy the support of a beta regression. Stance labels&#x2014;SIF, IF, N, A, and SA&#x2014;were one-hot encoded, using neutral as the reference category. Channel-level covariates included the natural logarithm of the subscribers to the channels (LogSub) and the square root of the channels&#x2019; video counts (CHV):</p><p>LogSub<italic><sub>v</sub></italic> = ln(subscriberCount<italic><sub>v</sub></italic>)</p><p>CHV<italic><sub>v</sub></italic> = <inline-formula><mml:math id="ieqn1"><mml:msqrt><mml:mi>v</mml:mi><mml:mi>i</mml:mi><mml:mi>d</mml:mi><mml:mi>e</mml:mi><mml:mi>o</mml:mi><mml:mi>C</mml:mi><mml:mi>o</mml:mi><mml:mi>u</mml:mi><mml:mi>n</mml:mi><mml:mi>t</mml:mi></mml:msqrt></mml:math></inline-formula></p><p>capturing audience reach and channel activity. Temporal exposure, measured in days since publication, controlled for the decay of engagement over time. These features served as predictors in our beta regression models of normalized engagement rates.</p><p>For clarity, we refer to the total counts of views, likes, and comments per video as raw interaction volume, and to the LR and CR as normalized engagement rates (interactions per view).</p></sec><sec id="s2-3-2"><title>Comment-Level Analysis</title><p>We then characterized user engagement by studying the comments associated with each video. Our dataset initially consisted of 60,507 labeled individual comments. Videos with fewer than 5 annotated comments were excluded from the controversy analysis to ensure statistical reliability. Comments were categorized as agreeing, disagreeing (D), or N, and were used to compute entropy-based opinion diversity, or the controversy score (CS) [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref43">43</xref>]: CS<sub>v</sub>=<italic>H</italic>(C<sub>A</sub>, C<sub>D</sub>), where <italic>H</italic>(&#x00B7;) denotes Shannon entropy. Note that the measure portrays opinion heterogeneity, and not merely the existence of disagreement, making it possible that the comments are all in disagreement with the video, but homogeneously so, making the discussion not internally controversial.</p></sec></sec><sec id="s2-4"><title>Statistical Analysis</title><sec id="s2-4-1"><title>Models</title><p>To statistically test our hypotheses regarding engagement, temporality, and discourse characteristics, we used a Bayesian framework. This approach provides a direct probabilistic interpretation of model parameters and full posterior distributions quantifying uncertainty. All models were specified using a consistent set of predictors to ensure comparability: the video&#x2019;s stance label (with &#x201C;neutral&#x201D; as the reference category), the log-transformed subscriber count (LogSub), and the CHV.</p><p>We assigned weakly informative normal priors (<italic>&#x03B2;<sub>j</sub></italic> &#x223C; Normal(0<italic>,&#x03C3;</italic><sup>2</sup>)) to all regression coefficients to regularize estimates and prevent overfitting.</p></sec><sec id="s2-4-2"><title>Engagement Rate Models</title><p>To model the LR and CR, which are proportions bounded between 0 and 1, we specified a beta regression model for each, a standard approach for proportional outcomes, as it respects the bounded support of the data. For each video <italic>i</italic>, the engagement rate <italic>y<sub>i</sub></italic> is assumed to follow a beta distribution:</p><disp-formula><label>(1)</label><mml:math id="eqn1"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mstyle displaystyle="true" scriptlevel="0"><mml:msub><mml:mi>y</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>&#x223C;</mml:mo><mml:mrow><mml:mi mathvariant="normal">B</mml:mi><mml:mi mathvariant="normal">e</mml:mi><mml:mi mathvariant="normal">t</mml:mi><mml:mi mathvariant="normal">a</mml:mi></mml:mrow><mml:mtext>&#x00A0;</mml:mtext><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:msub><mml:mi>&#x03BC;</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>&#x22C5;</mml:mo><mml:mi>&#x03BA;</mml:mi><mml:mo>,</mml:mo><mml:mtext>&#x00A0;</mml:mtext><mml:mo stretchy="false">(</mml:mo><mml:mn>1</mml:mn><mml:mo>&#x2212;</mml:mo><mml:msub><mml:mi>&#x03BC;</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo stretchy="false">)</mml:mo><mml:mo>&#x22C5;</mml:mo><mml:mi>&#x03BA;</mml:mi></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mstyle></mml:mrow></mml:mstyle></mml:math></disp-formula><p>where the mean <italic>&#x00B5;<sub>i</sub></italic> is linked to the predictors via a logit link function:</p><disp-formula><label>(2)</label><mml:math id="eqn2"><mml:mstyle><mml:mrow><mml:mstyle displaystyle="false"><mml:mi>logit</mml:mi><mml:mo>&#x2061;</mml:mo><mml:mo stretchy="false">(</mml:mo><mml:msub><mml:mi>&#x03BC;</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo stretchy="false">)</mml:mo><mml:mo>=</mml:mo><mml:msub><mml:mi>&#x03B2;</mml:mi><mml:mn>0</mml:mn></mml:msub><mml:mo>+</mml:mo><mml:msub><mml:mi>&#x03B2;</mml:mi><mml:mrow><mml:mtext>label</mml:mtext><mml:mo stretchy="false">[</mml:mo><mml:mi>i</mml:mi><mml:mo stretchy="false">]</mml:mo></mml:mrow></mml:msub><mml:mo>+</mml:mo><mml:msub><mml:mi>&#x03B2;</mml:mi><mml:mrow><mml:mtext>LogSub</mml:mtext></mml:mrow></mml:msub><mml:mo>&#x22C5;</mml:mo><mml:msub><mml:mrow><mml:mi mathvariant="normal">L</mml:mi><mml:mi mathvariant="normal">o</mml:mi><mml:mi mathvariant="normal">g</mml:mi><mml:mi mathvariant="normal">S</mml:mi><mml:mi mathvariant="normal">u</mml:mi><mml:mi mathvariant="normal">b</mml:mi></mml:mrow><mml:mi>i</mml:mi></mml:msub><mml:mo>+</mml:mo><mml:msub><mml:mi>&#x03B2;</mml:mi><mml:mrow><mml:mtext>CHV</mml:mtext></mml:mrow></mml:msub><mml:mo>&#x22C5;</mml:mo><mml:msub><mml:mrow><mml:mi mathvariant="normal">C</mml:mi><mml:mi mathvariant="normal">H</mml:mi><mml:mi mathvariant="normal">V</mml:mi></mml:mrow><mml:mi>i</mml:mi></mml:msub></mml:mstyle></mml:mrow></mml:mstyle></mml:math></disp-formula><p>The precision parameter <italic>&#x03BA;</italic> was assigned a broad half-normal prior. The exponentiated coefficients are interpreted as odds ratios (ORs), representing the multiplicative change in odds of engagement per unit increase in the predictor.</p></sec><sec id="s2-4-3"><title>Engagement Temporality Model</title><p>To model the speed of engagement, we predicted the number of days required to reach 90% of total engagement (<italic>P</italic>90). As this outcome is a positive integer count, we specified a <italic>negative binomial regression model</italic>, which is well-suited for overdispersed count data. The number of days <italic>d<sub>i</sub></italic> for video <italic>i</italic> is modeled as:</p><disp-formula><label>(3)</label><mml:math id="eqn3"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mstyle displaystyle="true" scriptlevel="0"><mml:msub><mml:mi>d</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>&#x223C;</mml:mo><mml:mtext>NegativeBinomial</mml:mtext><mml:mo stretchy="false">(</mml:mo><mml:msub><mml:mi>&#x03BC;</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>;</mml:mo><mml:mi>&#x03B1;</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:mstyle></mml:mrow></mml:mstyle></mml:math></disp-formula><p>where the mean <italic>&#x00B5;<sub>i</sub></italic> is linked to the predictors via a log link function, and <italic>&#x03B1;</italic> is the dispersion parameter:</p><disp-formula><label>(4)</label><mml:math id="eqn4"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mi>log</mml:mi><mml:mo>&#x2061;</mml:mo><mml:mo stretchy="false">(</mml:mo><mml:msub><mml:mi>&#x03BC;</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo stretchy="false">)</mml:mo><mml:mo>=</mml:mo><mml:msub><mml:mi>&#x03B2;</mml:mi><mml:mn>0</mml:mn></mml:msub><mml:mo>+</mml:mo><mml:msub><mml:mi>&#x03B2;</mml:mi><mml:mrow><mml:mtext>label</mml:mtext><mml:mo stretchy="false">[</mml:mo><mml:mi>i</mml:mi><mml:mo stretchy="false">]</mml:mo></mml:mrow></mml:msub><mml:mo>+</mml:mo><mml:msub><mml:mi>&#x03B2;</mml:mi><mml:mrow><mml:mtext>LogSub</mml:mtext></mml:mrow></mml:msub><mml:mo>&#x22C5;</mml:mo><mml:msub><mml:mtext>LogSub</mml:mtext><mml:mi>i</mml:mi></mml:msub><mml:mo>+</mml:mo><mml:msub><mml:mi>&#x03B2;</mml:mi><mml:mrow><mml:mtext>CHV</mml:mtext></mml:mrow></mml:msub><mml:mo>&#x22C5;</mml:mo><mml:msub><mml:mtext>CHV</mml:mtext><mml:mi>i</mml:mi></mml:msub></mml:mstyle></mml:mrow></mml:mstyle></mml:math></disp-formula><p>To control for endogeneity&#x2014;specifically the mechanical correlation between low engagement volume and faster saturation&#x2014;we fit a sensitivity specification adding log-transformed total engagement (<italic>&#x03B2;</italic><sub>Vol</sub> &#x00B7; log(TotalViews<sub><italic>i</italic></sub>)) to the linear predictor. The exponentiated coefficients from these models are interpreted as incidence rate ratios (IRRs), representing the multiplicative change in expected days to reach P90.</p></sec><sec id="s2-4-4"><title>Discourse Characteristic Models</title><p>Finally, to analyze the nature of the comment section discourse, we fit two separate models.</p><p><italic>Disagreement model:</italic> To predict the proportion of disagreeing comments (<italic>prop</italic><sub>disagree</sub>), we used a beta regression model identical in structure to the engagement rate models (Equations 1 and 2).</p><p><italic>Controversy model:</italic> To predict the CS, which is a continuous, unbounded variable, we specified a standard <italic>Bayesian linear regression model</italic> assuming a normal (Gaussian) likelihood. For video <italic>i</italic>, the CS is modeled as:</p><disp-formula><label>(5)</label><mml:math id="eqn5"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mstyle displaystyle="true" scriptlevel="0"><mml:msub><mml:mtext>CS</mml:mtext><mml:mi>i</mml:mi></mml:msub><mml:mo>&#x223C;</mml:mo><mml:mtext>Normal</mml:mtext><mml:mo stretchy="false">(</mml:mo><mml:msub><mml:mi>&#x03BC;</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>,</mml:mo><mml:msup><mml:mi>&#x03C3;</mml:mi><mml:mn>2</mml:mn></mml:msup><mml:mo stretchy="false">)</mml:mo></mml:mstyle></mml:mrow></mml:mstyle></mml:math></disp-formula><p>where the mean <italic>&#x00B5;<sub>i</sub></italic> is directly modeled as a linear combination of the predictors:</p><disp-formula><label>(6)</label><mml:math id="eqn6"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mstyle displaystyle="true" scriptlevel="0"><mml:msub><mml:mi>&#x03BC;</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:msub><mml:mi>&#x03B2;</mml:mi><mml:mn>0</mml:mn></mml:msub><mml:mo>+</mml:mo><mml:msub><mml:mi>&#x03B2;</mml:mi><mml:mrow><mml:mtext>label</mml:mtext><mml:mo stretchy="false">[</mml:mo><mml:mi>i</mml:mi><mml:mo stretchy="false">]</mml:mo></mml:mrow></mml:msub><mml:mo>+</mml:mo><mml:msub><mml:mi>&#x03B2;</mml:mi><mml:mrow><mml:mtext>LogSub</mml:mtext></mml:mrow></mml:msub><mml:mo>&#x22C5;</mml:mo><mml:msub><mml:mtext>LogSub</mml:mtext><mml:mi>i</mml:mi></mml:msub><mml:mo>+</mml:mo><mml:msub><mml:mi>&#x03B2;</mml:mi><mml:mrow><mml:mtext>CHV</mml:mtext></mml:mrow></mml:msub><mml:mo>&#x22C5;</mml:mo><mml:msub><mml:mtext>CHV</mml:mtext><mml:mi>i</mml:mi></mml:msub></mml:mstyle></mml:mrow></mml:mstyle></mml:math></disp-formula><p>The coefficients (<italic>&#x03B2;<sub>j</sub></italic>) from this model represent the direct additive change in the CS score.</p><p>Bayesian models allow us to move beyond simple averages to understand the probability of engagement. In the results that follow, we report ORs to measure the likelihood of interaction; a value greater than one indicates that a video is more likely to receive likes or comments than neutral content. We also report IRRs for our timing analysis; here, a value less than one signifies a &#x201C;speedup,&#x201D; meaning the video accumulates its audience and saturates its engagement potential more rapidly than the baseline.</p><p>Additionally, we validate findings under frequentist statistical frameworks and assess sensitivity to model specification. Results and details appear in Sections B-E in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p></sec></sec><sec id="s2-5"><title>Ethical Considerations</title><p>This observational study analyzed publicly available YouTube content collected via the official YouTube Data API v3; it involved no direct interaction with human participants. Consequently, institutional review board (IRB) approval was deemed unnecessary, and the research complies entirely with YouTube&#x2019;s Terms of Service. To protect user privacy, all individual usernames, user IDs, and identifying metadata associated with the comments were removed during data processing, and the comment text was deidentified. For transparency and reproducibility, examples of the public, high-profile YouTube channels analyzed in this study are listed in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. These channels represent public entities and major creators with no reasonable expectation of privacy regarding their broadcasted content.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Videos</title><sec id="s3-1-1"><title>Overview</title><p>We begin by examining the user engagement with the videos in our dataset. As can be seen in <xref ref-type="table" rid="table1">Table 1</xref>, more videos have been classified as either &#x201C;strongly in favor&#x201D; or &#x201C;in favor&#x201D; of vaccination, although there are around 1500 videos in the &#x201C;against&#x201D; and &#x201C;strongly against&#x201D; categories.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Video categories, score ranges, number of videos and channels in each category, and the proportion of videos to a channel. Note that the number of channels is presented per category and may overlap (the number of unique channels in the dataset is 3335).</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Category</td><td align="left" valign="bottom">Score range</td><td align="left" valign="bottom">Videos, n</td><td align="left" valign="bottom">Channels, n</td><td align="left" valign="bottom">Videos/channel</td></tr></thead><tbody><tr><td align="left" valign="top">Strongly in favor</td><td align="left" valign="top">[0.5, 1]</td><td align="left" valign="top">2492</td><td align="left" valign="top">1558</td><td align="left" valign="top">1.60</td></tr><tr><td align="left" valign="top">In favor</td><td align="left" valign="top">(0, 0.5)</td><td align="left" valign="top">1172</td><td align="left" valign="top">850</td><td align="left" valign="top">1.38</td></tr><tr><td align="left" valign="top">Neutral</td><td align="left" valign="top">[0]</td><td align="left" valign="top">996</td><td align="left" valign="top">796</td><td align="left" valign="top">1.25</td></tr><tr><td align="left" valign="top">Against</td><td align="left" valign="top">(&#x2013;0.5, 0)</td><td align="left" valign="top">602</td><td align="left" valign="top">437</td><td align="left" valign="top">1.36</td></tr><tr><td align="left" valign="top">Strongly against</td><td align="left" valign="top">[&#x2013;1.0, &#x2013;0.5]</td><td align="left" valign="top">812</td><td align="left" valign="top">585</td><td align="left" valign="top">1.39</td></tr></tbody></table></table-wrap></sec><sec id="s3-1-2"><title>Extent of Engagement</title><p>To establish the popularity of each video, we consider the last snapshot of its metadata that we have captured, which would be within a week of the end of the data collection period. <xref ref-type="fig" rid="figure2">Figure 2</xref> shows the distributions of the number of views, likes, and comments for the videos in each of the 5 categories. The vertical lines signify the median value of the distribution, which is also shown in the upper right of each plot, as well as the mean. Because the distributions are heavy-tailed, the mean is affected by the few popular outliers and is thus sometimes several orders of magnitude larger than the median. Note that we are witnessing the videos at different times from their posting. Even though on average the videos labeled as &#x201C;against&#x201D; or &#x201C;strongly against&#x201D; are slightly &#x201C;older&#x201D; (mean 86 [SD 48] and mean 82 [SD 48], respectively) than those labeled as &#x201C;in favor&#x201D; or &#x201C;strongly in favor&#x201D; (mean 98 [SD 50] and mean 87 [SD 51], respectively), the standard deviations are so large that the effect of video age is negligible when comparing distributions within label categories.</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Distributions of video engagement by stance, shown in raw counts and normalized rates. (A) Log-log frequency plots for views, likes, and comments; dashed vertical lines indicate the median. The y-axis represents the number of videos. Vaccine-hesitant stances (&#x201C;A&#x201D; and &#x201C;SA&#x201D;) tend to have higher median engagement counts. (B) Histograms of normalized like ratio (LR) and comment ratio (CR), the y-axis represents the percentage of videos within each bin. Distributions for &#x201C;A&#x201D; and &#x201C;SA&#x201D; stances are shifted to the right, indicating a higher rate of engagement per view compared to provaccine (&#x201C;SIF&#x201D; and &#x201C;IF&#x201D;) and neutral (&#x201C;N&#x201D;) stances. A: against; IF: in favor; N: neutral; SA: strongly against; SIF: strongly in favor.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v28i1e88519_fig02.png"/></fig><p>Using all 3 metrics of engagement, we find that the videos in the A and SA categories receive much more attention than those IF and SIF categories. The difference in median views, for instance, differs by an order of magnitude from &#x201C;strongly against&#x201D; at 1065 (IQR 55-14,559) to &#x201C;strongly in favor&#x201D; at 135 (IQR 26-690). The views of &#x201C;against&#x201D; videos are even greater, at the median of 2051 (IQR 50-21,167). Further, 24.7% (615/2492) of the videos in the &#x201C;strongly in favor&#x201D; category received no likes at all, compared to 13.2% (107/812) of those in the &#x201C;strongly against&#x201D; category. The situation is even more dire for comments&#x2014;a more strenuous action than a like&#x2014;wherein the disparity is at 52.2% (1300/2492) compared to 27.5% (223/812), respectively. When normalized by views, these differences translate to substantial engagement asymmetries: vaccine-hesitant videos (&#x201C;against&#x201D; and &#x201C;strongly against&#x201D;) have median like ratio of 0.056 and 0.058 (ie, 5.6 and 5.8 likes per 100 views), respectively, compared to 0.020 for strongly in favor videos&#x2014;a 2.8- to 2.9-fold engagement advantage. Combined raw interaction volume (likes+comments) yields approximately 10-fold higher engagement for vaccine-hesitant content (see Table S7 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> for detailed comparison).</p></sec><sec id="s3-1-3"><title>Statistical Analysis</title><p>To provide a comprehensive statistical account of online vaccine discourse, we fit a series of Bayesian regression models predicting 3 key outcomes: engagement rates, engagement temporality, and discourse characteristics. The posterior distributions for the coefficients of each model are visualized in <xref ref-type="fig" rid="figure3">Figure 3</xref>. All comparisons are made relative to a neutral video stance. All model parameters converge (<italic>R</italic>&#x2248;1 for all variables).</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Posterior distributions of coefficients from Bayesian models of engagement and discourse. The figure summarizes the results of 3 sets of Bayesian regression models. Ridge plots show the posterior probability distribution for each predictor&#x2019;s effect size on the logit (for rates) or log (for counts) scale. Horizontal bars represent the 94% highest density interval (HDI). A distribution to the right of the zero line indicates a positive association; to the left indicates a negative association. (A) Engagement: models predicting the like ratio and comment ratio. (B) Days to 90% of engagement: models predicting the number of days to reach 90% of total views, likes, or comments. A negative coefficient signifies a faster trajectory. (C) Discourse characteristics: models predicting the proportion of disagreeing comments and the controversy score (CS). The channel video counts (CHV) variable had no significant effect for all the models; it is not shown in the plots. Even when controlling for channel size, vaccine-hesitant stances are the strongest predictors of high normalized engagement rates and accelerated temporal saturation. A: against; IF: in favor; SA: strongly against; SIF: strongly in favor.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v28i1e88519_fig03.png"/></fig><p><xref ref-type="fig" rid="figure3">Figure 3A</xref> displays the predictors for LR and CR. The results show a clear divergence in how audiences interact with pro- versus vaccine-hesitant content. For the like ratio model, we find strong evidence that vaccine-hesitant stances are associated with higher rates of likes compared to neutral content. The odds of a viewer liking a SA video are approximately 1.8% higher (OR 1.018, 94% highest density interval [HDI] 1.012-1.024), and 1.3% higher for an A video (OR 1.013, 94% HDI 1.007-1.020). The credible intervals for both coefficients are entirely above 1.0, indicating high certainty in the positive effect. Conversely, the IF stance is associated with a statistically credible decrease in the odds of receiving a like, with the odds being 0.8% lower (OR 0.992, 94% HDI 0.986-0.997). The effect for SIF is more uncertain, with a credible interval that just touches an OR of 1.0 (94% HDI 0.991-1.000).</p><p>The comment ratio model indicates that vaccine-hesitant content is most effective at stimulating discussion. Both A and SA stances are associated with a small but certain increase in the odds of commenting, with ORs of 1.008 (94% HDI 1.004-1.012) and 1.007 (94% HDI 1.003-1.011), respectively. The effects for provaccine stances (SIF and IF) are centered precisely on an OR of 1.0, with credible intervals that broadly overlap 1.0, indicating their effect on the comment ratio is indistinguishable from that of neutral content. Across both models, the channel characteristics LogSub and CHV showed very small and uncertain effects. Collectively, these models provide quantitative evidence that vaccine-hesitant content is more successful at generating positive feedback (likes), while also being slightly more effective at stimulating discussion (comments).</p><p>To validate these findings under alternative statistical frameworks, we conducted robustness checks using logit-ordinary least squares regression with heteroskedasticity-consistent (HC3) standard errors (Section B in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p><p>These models statistically confirm that the &#x201C;engagement advantage&#x201D; of vaccine-hesitant content is not a random artifact. The data show that a user watching a vaccine-skeptic video is significantly more likely to click &#x201C;like&#x201D; or leave a comment than a user watching a provaccine video, regardless of the channel&#x2019;s size. This suggests that hesitant narratives are inherently more effective at eliciting active feedback from their audience.</p></sec></sec><sec id="s3-2"><title>Engagement Over Time</title><p>Next, we take advantage of the regular requerying of the engagement statistics to examine the temporal trend of the views, likes, and comments the video receives after its posting. <xref ref-type="fig" rid="figure4">Figure 4</xref> shows the trajectories of views, likes, and comments of the videos in each of the label categories. For each statistic, we also compute an average trajectory line and show it in color. We also show (by the vertical line) the number of days at which the average trajectory reaches 90% (P90) of the statistic. For instance, videos labeled as &#x201C;strongly in favor&#x201D; on average reach 90% of their views at day 32 (IQR 18-64), whereas those labeled as &#x201C;strongly against&#x201D; reach it at day 18 (IQR 8-38).</p><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>The engagement &#x201C;trajectories&#x201D; showing the percentage of views, likes, or comments (see row labels) the video achieves over days (x-axis), by label category (shown above each plot). The trajectories for each day are in light gray, and the average trajectory is in color. The vertical bar marks the number of days at which the average trajectory reaches 90% of the statistic. For likes and comments, videos are limited to those having more than 1 like or comment, respectively. Vaccine-hesitant content saturates significantly faster (median 18 days) than provaccine content (median 32 days), creating a narrow window for effective public health counter-messaging. A: against; IF: in favor; N: neutral; P90: 90% of total engagement; SA: strongly against; SIF: strongly in favor.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v28i1e88519_fig04.png"/></fig><p>Although it is not possible for views to decrease over time, it is possible for the number of likes or comments to decrease when a like is unselected or a comment is deleted. This introduces some noise, especially for those videos that have only one comment or like. For this reason, the analysis of the likes and comments includes only videos that had more than 1 like or comment (respectively) in our dataset. See Section H in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> for plots that include all videos, as well as the same statistics at thresholds 5 and 10.</p><p>Considering all of the engagement metrics, we find that the videos labeled as &#x201C;against&#x201D; or &#x201C;strongly against&#x201D; vaccination reach their peak engagement sooner than those in favor. Visually, the trend lines become sharper at the &#x201C;knee&#x201D; (where the distribution starts reaching a plateau). The pattern remains similar at thresholds 5 and 10 (see Section H in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>), though the magnitude of the difference between &#x201C;strongly in favor&#x201D; and &#x201C;strongly against&#x201D; decreases in the case of comments, which are sparser than likes.</p><p>To quantitatively characterize the temporal saturation of engagements, we use a nonnegative binomial Bayesian model. The center panel of <xref ref-type="fig" rid="figure3">Figure 3B</xref> models the speed at which videos accumulate their audience, predicting the number of days required to reach 90% of total engagement (P90). The results from our Bayesian negative binomial models show that vaccine-hesitant content reaches its engagement peak significantly faster than neutral or provaccine content. For the trajectory of likes, videos with an A stance are expected to reach their P90 approximately 24% faster than neutral videos (IRR 0.76, 94% HDI 0.658-0.864). Similarly, SA videos are approximately 20% faster (IRR 0.80, 94% HDI 0.705-0.905).</p><p>In contrast, provaccine content exhibits a slower rate of engagement accumulation. SIF videos are predicted to take approximately 12% longer to reach their P90 peak (IRR 1.12, 94% HDI 1.016-1.242), with a credible interval entirely above 1.0. The effect for IF videos is indistinguishable from neutral content (IRR 0.99, 94% HDI 0.882-1.112). These patterns were consistent across the models for views, likes, and comments. Furthermore, we found a strong effect for channel size, with each unit increase in LogSub associated with a trajectory that is approximately 17% faster (IRR 0.83, 94% HDI 0.803-0.856), suggesting that videos from larger channels accumulate their engagement more quickly.</p><p>To address endogeneity of temporal saturation, we conducted a sensitivity analysis by refitting the negative binomial P90 models with additional control for log-transformed total views. This specification tests whether stance effects on days-to-saturation reflect genuine timing asymmetries or merely mechanical confounding. The mechanism of potential confounding is straightforward: videos receiving fewer total likes or views will, by definition, reach a 90% engagement threshold sooner than videos with higher engagement ceilings. If stance predicts both engagement volume and timing, the observed temporal asymmetry could be entirely mechanical rather than reflecting genuine differences in how quickly vaccine-hesitant versus provaccine content accumulates engagement.</p><p>The controlled models substantially attenuated the stance effects on P90 days. For &#x201C;strongly against&#x201D; videos, IRR for temporal saturation decreased from 0.56 (44% faster saturation; 94% HDI 0.50-0.62) in the uncontrolled baseline model to 0.80 (20% faster saturation; 94% HDI 0.70-0.90) after controlling for log(TotalViews). This 24 percentage point reduction represents substantial confounding. The control variable itself had a positive coefficient (IRR 1.042, 94% HDI 1.021-1.061), meaning that videos accumulating more total engagement reached P90 more slowly, consistent with a pattern of sustained engagement growth rather than front-loaded spikes. Approximately 54% of the uncontrolled 44% effect appears attributable to mechanical confounding, while 46% persists as a genuine timing advantage. This controlled estimate of 20% faster saturation for vaccine-hesitant content represents a more conservative but still substantial temporal asymmetry, indicating that these videos not only receive less total engagement but also concentrate their engagement into a shorter time window relative to their final engagement level. All parameters achieved acceptable convergence (<italic>R</italic> &#x003C;1.01). Detailed results are shown in Section G in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p><p>In summary, we find that vaccine-hesitant content has a &#x201C;speed advantage.&#x201D; By raw timing, while provaccine content accumulates its audience gradually over a month (32 days to P90), vaccine-hesitant content experiences a concentrated burst of activity, saturating within 18 days (44% faster). However, a portion of this temporal advantage reflects mechanical confounding: videos with lower total engagement reach absolute thresholds sooner by definition. Sensitivity analysis controlling for log-transformed total engagement attenuates the effect from 44% to 20% faster saturation, indicating that approximately 54% of the raw temporal advantage reflects mechanical confounding while 46% persists as genuine temporal compression. This means vaccine-hesitant videos not only receive lower total engagement but also concentrate what engagement they receive into a narrower time window relative to their eventual engagement ceiling. Both the 44% practical effect and the 20% controlled effect have policy relevance: practitioners face the 44% saturation speed; researchers identify a 20% genuine temporal compression. This rapid early-stage lifecycle implies that the digital footprint of hesitant content is established quickly, suggesting that the window for effective counter-messaging or moderation is much narrower for this type of content.</p><p>In summary, the 18-day versus 32-day difference corresponds to a descriptive 44% faster saturation for vaccine-hesitant content, whereas the controlled IRR from the negative binomial model corresponds to a more conservative model-based estimate of 20% faster saturation after adjusting for total engagement volume.</p></sec><sec id="s3-3"><title>Comments</title><p>Beyond the quantity of audience interaction, we aimed to understand its nature. To this end, we classified comment stances relative to the video&#x2019;s own stance, analyzing the results in aggregate, by channel topic, and through the CS.</p><p>The aggregate results, shown in the &#x201C;all categories&#x201D; plot in <xref ref-type="fig" rid="figure5">Figure 5A</xref>, show that videos with SA and A stances are more likely to foster echo chambers; their comment sections are dominated by agreement, with 39.9% (6184/15,508) and 35.6% (6055/17,030) of comments agreeing, respectively (with only 18.6% (2889/15,508) and 25.7% (4379/17,030) disagreeing). In contrast, videos with SIF and IF stances attract significant contention, with higher disagreement rates of 35.9% (2751/7650) and 31.7% (2362/7440) and lower agreement rates of 24.4% (1870/7650) and 27.8% (2072/7440). This suggests that while vaccine-hesitant content fosters confirmatory engagement, provaccine content often serves as a &#x201C;battleground&#x201D; for public debate. Disaggregating by authority, we see that the &#x201C;battleground&#x201D; effect is most intense in health and entertainment (eg, 47.4% [138/291] disagreement on SIF health videos), while the knowledge topics (like doctor) appear more balanced, with &#x201C;strongly in favor&#x201D; videos attracting the highest rate of agreement (422/820, 51.5%) for any provaccine content.</p><fig position="float" id="figure5"><label>Figure 5.</label><caption><p>Comment agreement proportion by video stance, faceted by channel characteristics. The figure displays the normalized proportion of comment stances (D: disagree; N: neutral; A: agree) for videos, broken down by various channel categorizations. Each horizontal bar shows the proportion of comment types for a specific video stance (SIF: strongly in favor; IF: in favor; N: neutral; A: against; SA: strongly against) within that category. (A) Panels show distributions for channels grouped by their primary content category (eg, health and politics). (B) Panels show distributions for channels grouped by their declared authority (eg, doctor and news). (C) Panels show distributions for channels grouped by their institution type (individual, organization, other). Vaccine-hesitant videos function as confirmatory &#x201C;echo chambers&#x201D; (high agreement), while provaccine health videos serve as &#x201C;battlegrounds&#x201D; characterized by high levels of disagreement.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v28i1e88519_fig05.png"/></fig><p>These patterns are further explored in the ternary plots of <xref ref-type="fig" rid="figure6">Figure 6A</xref>, which visualize the distribution of individual videos in the tree level of agreement. Vaccine-hesitant videos (colored red and orange) mostly cluster in the top &#x201C;agree&#x201D; corner, providing strong visual evidence of echo chambers, particularly in the politics and society topics. Provaccine videos (colored blue) are distributed more broadly, with a significant concentration extending toward the bottom-left &#x201C;disagree&#x201D; corner and into the central battleground region, confirming their role as contentious battlegrounds.</p><fig position="float" id="figure6"><label>Figure 6.</label><caption><p>Visualizing discourse patterns through comment agreement distributions. This figure presents 3 perspectives on how audience agreement varies by video stance and topic. (A) A ternary plot visualizes each individual video&#x2019;s discourse pattern, colored by its own stance (red=strongly against, blue=strongly in favor). The top corner represents high agreement (&#x003E;60%), the bottom-left corner represents high disagreement (&#x003E;60%), and the bottom-right represents neutrality. Dashed lines demarcate &#x201C;echo chambers&#x201D; (areas where a single stance dominates &#x003E;60% of comments). Vaccine-hesitant videos (red) cluster heavily in the top &#x201C;agree&#x201D; echo chamber, particularly in society and politics. Provaccine videos (blue) are dispersed toward the bottom-left &#x201C;disagree&#x201D; corner and the center. N: neutral; SA: strongly against; SIF: strongly in favor. (B) The same distribution colored by controversy score (CS). Deep purple indicates high controversy (high entropy), corresponding to the &#x201C;battleground&#x201D; region in the center of the triangle where no single sentiment dominates. Bright teal indicates low controversy, aligning with the echo chambers at the corners. The platform simultaneously hosts an insulated agreement and intense public contention, mediated by the video&#x2019;s stance.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v28i1e88519_fig06.png"/></fig><p>Building on these observed patterns, we then colored the same distribution by the CS to quantify the level of contention (<xref ref-type="fig" rid="figure6">Figure 6B</xref>). The results confirm that the CS effectively captures the distinction between echo chambers and battlegrounds. The lowest controversy scores (bright teal) are heavily concentrated in the corners of the plots, particularly the top &#x201C;agree&#x201D; corner, aligning with the confirmatory echo chambers identified in the vaccine-hesitant videos. In contrast, the highest controversy scores (deep purple) are found in the center of the triangle, corresponding to the &#x201C;battleground&#x201D; videos that attract a chaotic mix of agreeing, disagreeing, and neutral comments. By comparing the topic-specific panels, we can see that the health topic contains a prominent cluster of high-controversy (purple) videos in its center, quantitatively confirming it is the most contentious domain. This shows that the CS metric captures the observed discourse patterns, mapping high consensus to low controversy and high conversational diversity to high controversy.</p><p><xref ref-type="fig" rid="figure3">Figure 3C</xref> analyzes the nature of the comment section itself by modeling the proportion of disagreement and the CS. The results statistically confirm our &#x201C;battleground vs echo chamber&#x201D; hypothesis with quantitative evidence. In the <italic>disagreement model</italic>, provaccine stances are associated with a higher likelihood of attracting dissent. Compared to neutral videos, a SIF stance increases the odds of a comment disagreeing by approximately 5% (OR 1.05, 94% HDI 1.003-1.094). In contrast, a SA stance is associated with a decrease in the odds of disagreement by about 7% (OR 0.93, 94% HDI 0.898-0.972), with its credible interval falling entirely below 1.0. This provides strong statistical evidence that SA videos foster more agreeable, echo-chamber-like environments.</p><p>The <italic>controversy score model</italic> further clarifies this dynamic. The SIF stance is associated with a statistically credible decrease in the CS of approximately 0.075 units (94% HDI &#x2013;0.119 to &#x2013;0.033) compared to neutral content. At first glance, this seems counterintuitive. However, it suggests that while SIF videos attract more direct disagreement (a 2-way debate), neutral videos foster a more chaotic and unpredictable mix of &#x201C;agree,&#x201D; &#x201C;disagree,&#x201D; and &#x201C;neutral&#x201D; comments. The CS metric captures entropy, not just disagreement: perfectly balanced agree/disagree comments have lower CS than chaotic agree/disagree/neutral mixtures. Thus, more focused contention (SIF videos) can have lower CS than less predictable patterns. The effects of other stances (IF, A, SA) on the CS are uncertain, with credible intervals that all broadly overlap zero. Across both models, channel size (LogSub) has a significant positive effect, indicating that videos from larger channels tend to host both more disagreeable and more broadly controversial debates.</p><p>Our analysis delineates 2 distinct social environments coexisting on the platform. Vaccine-hesitant videos function largely as &#x201C;echo chambers&#x201D; where users reinforce each other&#x2019;s views with high agreement. In contrast, provaccine videos&#x2014;especially those from health institutions&#x2014;function as &#x201C;battlegrounds&#x201D; characterized by debate and dissent. This distinction is crucial for interpretation, as it clarifies that high engagement numbers on provaccine content often reflect controversy and argument rather than consensus or support.</p></sec><sec id="s3-4"><title>Channels</title><p>Next, we show that the provaccine and vaccine-hesitant content largely originates from two distinct creator ecosystems. This section details the evidence for this sourcing asymmetry by examining the topical framing, authority signals, and institutional identity of the channels in our dataset.</p><p>To contextualize our findings, we first characterized the topical composition of the 7213 videos using the categories of the posting channel. Using a hierarchical resolution of YouTube&#x2019;s metadata, we categorized videos into 3 primary topics: health (4027/6074, 66.3%), politics (918/6074, 15.1%), and society (628/6074, 10.3%). This hierarchical approach was necessary due to the prevalence of multitopic assignments in the original metadata (71.8% of videos), reflecting the inherently multidimensional nature of vaccine discourse. As shown in our subsequent analyses, this topical framing emerges as a significant moderator of engagement and comment discourse.</p><p>The distribution of video stances across these channel characteristics is presented in <xref ref-type="fig" rid="figure7">Figure 7</xref>. By topic (<xref ref-type="fig" rid="figure7">Figure 7A</xref>), health-related videos are slightly more provaccine (49.3% [1987/4027] &#x201C;strongly in favor&#x201D; and 21% [847/4027] &#x201C;in favor&#x201D;), whereas politics and society topics show more balanced distributions. This suggests health-framed discussions may attract greater institutional participation, while politics and society frames host a more diverse set of creator viewpoints.</p><fig position="float" id="figure7"><label>Figure 7.</label><caption><p>Share of videos posted by channels with certain labels per channel categories found in the metadata (A) and per authority (B) and institution (C) labels manually annotated on a subset of 645 channels. Provaccine discourse is dominated by institutional voices (news/health organizations), whereas vaccine-hesitant content is driven by individual creators, including self-identified medical doctors who bypass institutional constraints. A: against; IF: in favor; N: neutral; SA: strongly against; SIF: strongly in favor.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v28i1e88519_fig07.png"/></fig><p>This pattern is further intricate when considering the authority of a channel&#x2019;s signals extracted via manual annotation (<xref ref-type="fig" rid="figure7">Figure 7B</xref>). Channels identified as news or about health predominantly post content in favor of vaccination, with 66% (870/1318) and 77.7% (237/305) falling into the combined &#x201C;strongly in favor&#x201D; and &#x201C;in favor&#x201D; categories, and with minimal representation in the strongly against category. In contrast, channels run by (self-declared) doctors post content both in support and against vaccination. Finally, entertainment and opinion channels display the most heterogeneous distributions, including significant portions of antivaccine content, suggesting these creators serve diverse audiences, often without the institutional constraints that guide health or news organizations.</p><p><xref ref-type="fig" rid="figure7">Figure 7C</xref> shows a clear distinction between organizational and individual creators. Organizations are more represented in provaccine content production (1103/1598, 69%) of their videos fall in the &#x201C;strongly in favor&#x201D; and &#x201C;in favor&#x201D; categories combined, versus only 10.8% (172/1598) in &#x201C;strongly against,&#x201D; whereas individual creators exhibit greater stance diversity. Only 18.6% (132/708) of videos from individual creators are &#x201C;strongly in favor,&#x201D; while 25.1% (178/708) are &#x201C;strongly against,&#x201D; pointing to the need for engagement with individual posters to tackle such content.</p><p>These distributional patterns are reflected in the composition of the most prolific channels in our dataset (Section I in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). The 10 channels that posted the most videos are responsible for just 5% of the total volume (Gini=0.39), indicating that the content is not dominated by a few voices. This list includes a mix of news organizations, such as CTV and 9NEWS, which primarily post provaccine content, alongside individual creators like a self-described doctor or a showman, who are significant contributors to the vaccine-hesitant discourse. This mix illustrates the broader patterns in action: news media are an important contributor of vaccine-related content, but influencers and alternative voices have a strong and countervailing presence.</p><p>Finally, we investigated how the source of a video impacts audience discourse by analyzing comment agreement patterns across these channel types (<xref ref-type="fig" rid="figure5">Figure 5B,C</xref>). The results show that the nature of the creator significantly shapes the comment section&#x2019;s dynamics. Within the Authority categorization, for instance, health channels exhibit the most polarized reactions, fostering strong echo chambers for &#x201C;strongly against&#x201D; videos (82% agreement) while their &#x201C;strongly in favor&#x201D; videos become &#x201C;battlegrounds&#x201D; (50% disagreement). When categorized by institution, a clear distinction appears: videos from organizations tend to generate stronger echo chambers, especially for vaccine-hesitant content, while individual creators host more balanced and contentious conversations across the board.</p><p>In summary, the analysis of channel characteristics shows that provaccine and vaccine-hesitant content largely originates from two distinct creator ecosystems. The provaccine discourse is predominantly driven by organizations, particularly news and health institutions, which reach cohesive audiences. In parallel, the vaccine-hesitant discourse is more strongly represented by a diverse array of individual creators, who foster more contentious and heterogeneous comment sections. This fundamental divergence in sourcing is crucial for understanding why these two types of content exhibit such different engagement dynamics and foster such different online communities.</p></sec><sec id="s3-5"><title>Moderation</title><p>In the course of the collection, 243 videos at some point failed to return metadata results during the periodic recollection efforts. We manually examined the errors the YouTube interface provided for these, and found that for 116, the platform simply tells the users that the &#x201C;This video isn&#x2019;t available anymore,&#x201D; 66 have been made private by the uploader, 50 were unavailable due to the posting account having been terminated by the platform, 3 were removed by the uploader (a message distinct from the video simply being unavailable), 6 were removed due to violating YouTube&#x2019;s Community Guidelines or Terms of Services, one because the uploader has closed their YouTube account, and one because of a copyright claim. We consider the video disappearances attributed to the author separately from all others (which we attribute to the platform), and find the rates shown in <xref ref-type="fig" rid="figure8">Figure 8</xref>. We find that the removals by the author of the video happen more for &#x201C;strongly in favor&#x201D; and &#x201C;in favor&#x201D; videos, whereas videos labeled as &#x201C;against&#x201D; or &#x201C;strongly against&#x201D; were more likely to be removed by the platform.</p><fig position="float" id="figure8"><label>Figure 8.</label><caption><p>Percentage of videos in each stance that have been removed. Bars distinguish between videos made private or deleted by the uploader (by author) and those taken down for guideline violations (by platform). A: against; IF: in favor; N: neutral; SA: strongly against; SIF: strongly in favor.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v28i1e88519_fig08.png"/></fig><p>Considering the error codes more closely, we find that all videos removed due to violating YouTube&#x2019;s Community Guidelines were either labeled as &#x201C;against&#x201D; or &#x201C;strongly against.&#x201D; On the other hand, videos that belonged to channels terminated by the platform span all 5 categories. Whenever the video was made private by its author, the label is more likely to be &#x201C;in favor&#x201D; or &#x201C;strongly in favor&#x201D; (77.3% [51/66] of such videos) than &#x201C;against&#x201D; or &#x201C;strongly against&#x201D; (9/66, 13.6%). Thus, we find a variety of reasons for the disappearance of videos, with some evidence of the platform&#x2019;s policies affecting more the vaccine-skeptic side when it comes to sanctioning content, but not necessarily the accounts themselves.</p><p>The median time of the video disappearing is 14.4 (IQR 4.9-35.8) days from its posting, meaning that half of the videos were taken down within that time. However, many remained until almost the end of our 3-month collection period, pointing to a low but constant level of moderation across time. Since most of the interactions with the video happen within the first few weeks of a video&#x2019;s posting, this policy likely fails to stem the majority of the video&#x2019;s impact.</p><p>Upon the examination of the metadata collected for the videos of accounts terminated by the platform (as the videos themselves were not available at the time of the analysis), we find that they largely consist of vaccine-skeptic, anti-establishment content, as well as likely semiautomated channels that repost news snippets. Those labeled as &#x201C;in favor&#x201D; of vaccines sometimes use sensationalized language, such as &#x201C;The truth might SHOCK you!&#x201D; (such phrases are often considered &#x201C;clickbait&#x201D; to attract an audience). Some also engage in &#x201C;keyword stuffing&#x201D; by including many keywords in the description of the video to increase the chance of attaining a higher rank during a search. Yet other accounts mention vaccination in the context of providing other information, such as a channel promoting US visas. Unfortunately, beyond the error message, we cannot obtain any additional information on why these accounts might have been removed; however, the above observations exemplify the low-quality content that public health institutions compete with on this platform. The last engagement information our data collection captured for these removed videos reflects the overall trend of videos against vaccination, showing more engagement than those in favor (see Section J in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Context</title><p>Prior YouTube vaccine studies have shown that vaccine-hesitant content receives more engagement than provaccine ones [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref44">44</xref>]. However, these snapshot-based analyses reveal only an engagement gap, leaving unanswered when and how fast this gap widens. By tracking engagement longitudinally, we document a previously unquantified temporal asymmetry: vaccine-hesitant videos saturate engagement significantly faster than provaccine content (44% faster in raw timing; 20% faster in model-based estimates that control for engagement volume). Furthermore, we challenge the assumption that polarization is symmetric [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]. Our comment analysis demonstrates that vaccine-hesitant videos function as agreeable echo chambers [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref46">46</xref>], whereas provaccine videos act as contentious battlegrounds. This suggests the platform hosts two distinct discourse architectures simultaneously, mediated by content stance.</p><p>Importantly, our analysis is purely observational: we do not observe recommendation paths or run interventions, and therefore we cannot identify causal effects of YouTube&#x2019;s ranking or recommendation systems; we interpret our results as patterns of realized engagement rather than causal impacts of specific algorithms.</p></sec><sec id="s4-2"><title>Engagement Asymmetry and the Temporal Window for Intervention</title><p>By quantifying engagement dynamics, we observe that vaccine-hesitant videos attract substantially higher normalized engagement rates (2.8 to 2.9&#x00D7; higher) and reach saturation significantly faster than provaccine content. This temporal dimension suggests that vaccine-hesitant content gains traction not through sustained growth, but through rapid early-stage saturation. While the observed speed advantage (44% faster descriptively) is partly driven by lower engagement ceilings, a genuine temporal compression persists even after controlling for this confounding (20% faster after controlling for total engagement). This distinction between threshold-crossing speed and engagement velocity deserves deeper attention.</p><p>The decomposition of this temporal asymmetry shows distinct audience dynamics. The portion of the speedup attributable to confounding indicates that vaccine-hesitant audiences are smaller but more efficient: they mobilize quickly from a self-selected pool, producing a &#x201C;peak-and-plateau&#x201D; dynamic characteristic of viral misinformation [<xref ref-type="bibr" rid="ref47">47</xref>]. Unlike provaccine content, which accumulates engagement incrementally as it diffuses through heterogeneous networks, vaccine-hesitant content exhibits the rapid consolidation typical of echo chambers [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref48">48</xref>]. This aligns with our comment-level findings: the structural homogeneity of the vaccine-skeptic audience facilitates rapid, confirmatory engagement, while the heterogeneity of the provaccine audience results in slower, contentious accumulation.</p><p>These findings identify a mechanism-specific temporal signature. Prior work established that false news spreads faster [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref15">15</xref>], but this study suggests that the temporal advantage operates through distinct audience structures: concentrated early-stage mobilization of in-groups versus distributed, delayed expansion into out-groups. From a policy perspective, this mechanism suggests that the critical window for intervention is not merely short (as commonly noted [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref49">49</xref>]) but compressed into a narrow audience demographic, concentrated in the initial 2 weeks post-upload.</p></sec><sec id="s4-3"><title>Implications for Intervention and Governance</title><p>The policy implications of this rapid saturation are 2-fold. First, the 18-day saturation window implies that practitioners must adopt real-time monitoring, as the majority of a video&#x2019;s impact crystallizes faster than traditional fact-checking cycles can respond. Second, since moderation actions in our dataset occurred with a median delay of 14.4 (IQR 4.9-35.8) days [<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref51">51</xref>], reactive content removal often arrives after the audience has already been saturated.</p><p>Therefore, effective intervention must target early audience composition rather than relying on post hoc removal. These empirical patterns motivate, but do not themselves test, potential intervention strategies. Conceptually, prebunking approaches that inoculate audiences against misinformation narratives [<xref ref-type="bibr" rid="ref52">52</xref>-<xref ref-type="bibr" rid="ref54">54</xref>] are particularly relevant here as they work before the rapid saturation occurs. Furthermore, saturated content is potentially amplified via cross-platform diffusion [<xref ref-type="bibr" rid="ref55">55</xref>]. Platforms should consider proactive algorithmic demotion of borderline content or the elevation of credible sources during the first 2 weeks of a video&#x2019;s lifecycle [<xref ref-type="bibr" rid="ref56">56</xref>,<xref ref-type="bibr" rid="ref57">57</xref>]. Rather than removing vaccine-hesitant content outright&#x2014;a strategy fraught with free-speech concerns and often ineffective after saturation [<xref ref-type="bibr" rid="ref58">58</xref>,<xref ref-type="bibr" rid="ref59">59</xref>]&#x2014;platforms could implement ranking systems that elevate credible sources in recommendation feeds, effectively competing for the attention of early audiences before echo chamber formation. Platform design choices that prioritize engagement metrics inadvertently amplify misinformation by selecting for emotionally resonant content [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref47">47</xref>]; reorienting algorithmic goals toward credibility rather than engagement represents a structural intervention with potential for large-scale impact [<xref ref-type="bibr" rid="ref57">57</xref>,<xref ref-type="bibr" rid="ref60">60</xref>].</p><p>While we found evidence of moderation, the median delay of 14.4 (IQR 4.9-35.8) days becomes critical when considered against the temporal dynamics we identified. Vaccine-hesitant videos concentrate their engagement&#x2014;a pattern indicating rapid in-group mobilization characteristic of echo chambers&#x2014;within approximately 18 days. Since moderation occurs 14.4 (IQR 4.9-35.8) days post-upload on median, content removal actions occur after the most intense period of audience concentration has already occurred, a finding that supports recent work on delayed moderation [<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref51">51</xref>].</p><p>Given the complexities of content removal [<xref ref-type="bibr" rid="ref58">58</xref>,<xref ref-type="bibr" rid="ref59">59</xref>], one possible policy intervention could be the proactive algorithmic amplification of content from verified health authorities, especially during the early days of a video&#x2019;s lifecycle [<xref ref-type="bibr" rid="ref56">56</xref>,<xref ref-type="bibr" rid="ref57">57</xref>,<xref ref-type="bibr" rid="ref61">61</xref>]. Platform design choices that prioritize engagement can inadvertently amplify misinformation [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref47">47</xref>]; therefore, strategic interventions to elevate credible sources could significantly improve the health information environment without resorting to widespread censorship [<xref ref-type="bibr" rid="ref60">60</xref>].</p><p>Our findings are consistent with these concerns, but we cannot speak directly about recommendation-system mechanisms. We therefore present these governance implications as hypotheses and directions for future experimental and audit studies, rather than as causal claims about the effects of specific policy levers.</p></sec><sec id="s4-4"><title>Discourse Patterns: The Role of Creators and Thematic Framing</title><p>According to our findings, online vaccine discourse is likely driven by two fundamentally different creator ecosystems. Provaccine content is predominantly produced by organizations (news and health institutions), whereas individual creators dominate the vaccine-hesitant space. This sourcing divergence is associated with different discourse patterns we observed: institutional videos tend to become &#x201C;battlegrounds&#x201D; of disagreement, while individual creators host &#x201C;echo chambers&#x201D; of agreement.</p><p>This dynamic may also be further modulated by thematic framing. Health-categorized videos, which attract the highest institutional participation, become the most intense sites of controversy [<xref ref-type="bibr" rid="ref62">62</xref>,<xref ref-type="bibr" rid="ref63">63</xref>]. In contrast, content framed around politics and society allows individual creators to cultivate highly agreeable, insulated communities [<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref64">64</xref>]. This suggests a fundamental tension: institutional voices attempt to maintain a medical frame, but the discourse persistently escapes into social and political contexts where individual voices claim equal standing. To bridge this gap, public health bodies should consider partnerships with credible individual creators&#x2014;such as doctors who vlog&#x2014;who can foster dialogue without triggering immediate polarization [<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref65">65</xref>,<xref ref-type="bibr" rid="ref66">66</xref>].</p></sec><sec id="s4-5"><title>Institutional Context and Future Policy Dynamics</title><p>It is important to situate these findings within the broader landscape of vaccine policy. Our data collection (November 2024 to May 2025) captures a moment of significant institutional uncertainty. The observed engagement asymmetry likely reflects not merely ambient polarization but the consequence of eroded trust, wherein health institutions themselves become sites of political contestation.</p><p>This raises theoretical questions for future research: Do engagement asymmetries intensify during periods of institutional distrust? Longitudinal monitoring across different policy contexts would clarify whether our findings represent a transient response to uncertainty or a structural feature of polarized health discourse. Additionally, without systematic auditing of recommendation systems, the degree to which these asymmetries reflect platform design versus audience-driven polarization remains an open question [<xref ref-type="bibr" rid="ref67">67</xref>]. Comparative studies across platforms and jurisdictions would strengthen our understanding of these mechanisms.</p></sec><sec id="s4-6"><title>Limitations</title><p>Our study has several limitations that define the scope of our findings.</p><sec id="s4-6-1"><title>Exclusion of Short-Form Video</title><p>Our analysis is intentionally focused on substantive, long-form YouTube videos (1&#x2010;60 minutes) and excludes short-form content like YouTube Shorts. This decision was made because Shorts exhibit fundamentally different engagement dynamics, algorithmic promotion, and content characteristics (eg, lack of transcripts) that would confound our analysis of engagement trajectories and argumentative stances [<xref ref-type="bibr" rid="ref68">68</xref>,<xref ref-type="bibr" rid="ref69">69</xref>]. While this exclusion enhances the internal validity of our findings on deliberative content, it limits their generalizability to the short-form video ecosystem, which represents a growing segment of online media consumption. Given the highly condensed and viral nature of Shorts, we hypothesize that their inclusion would likely amplify the rapid engagement saturation trends observed here, potentially fostering an even faster cycle of misinformation spread. Future research should analyze this content format separately, using methods suited to its visual and algorithmic nature.</p></sec><sec id="s4-6-2"><title>Other Exclusion Criteria</title><p>Besides excluding short-form videos, each step of our collection more precisely defines the scope of this study, and thus limits its generalizability to other scenarios, such as other topics, time periods, or countries. The keyword selection, for instance, may have excluded the content that refers to vaccination obliquely and focuses on mainstream medicine in general [<xref ref-type="bibr" rid="ref70">70</xref>]. Further, the focus of the collection was to sample the posted videos, and it is likely that some viral videos were not included in the sample, diminishing the extent of the skewness of our estimates of engagement. Studies using complementary methodology would be necessary to explore other aspects of the YouTube ecosystem.</p></sec><sec id="s4-6-3"><title>Temporal and Geographic Scope</title><p>Data collection (November 2024 &#x2013; May 2025) coincided with a period of heightened institutional contestation in US health policy. Consequently, the observed engagement dynamics likely characterize periods of high uncertainty rather than stable institutional consensus. Furthermore, as vaccine hesitancy drivers vary globally [<xref ref-type="bibr" rid="ref71">71</xref>], our findings are specific to the US-English context. Cross-cultural research is needed to determine if the &#x201C;engagement advantage&#x201D; of hesitancy is a universal platform feature or a byproduct of specific sociopolitical environments, such as the high political polarization found in the United States.</p></sec><sec id="s4-6-4"><title>Scalable Content Analysis Trade-Offs</title><p>To enable a large-scale longitudinal analysis, we used an LLM-based approach for content classification. While our method achieved high accuracy (84%) and perfect interrater reliability, it has limitations. First, stance classification was based on averaging scores from text excerpts, a method that may not fully capture videos with evolving narratives or strategic ambiguity. Second, the classification of texts is made difficult by the presence of humor, sarcasm, hyperbole, and other rhetorical devices that are challenging for both automated and human annotators to agree on (although the overall performance of the LLM-based approach largely agreed with that of the human labelers). Third, our comment analysis, classifying stance as agree/disagree/neutral, captures the balance of opinion but not the qualitative nature of the discourse. It does not distinguish between constructive debate and toxic trolling, nor does it analyze conversational structures like reply threads, which are important dimensions of online deliberation [<xref ref-type="bibr" rid="ref72">72</xref>,<xref ref-type="bibr" rid="ref73">73</xref>]. These trade-offs between scale and depth offer clear avenues for future qualitative and computational research.</p></sec><sec id="s4-6-5"><title>Sensitivity to Misclassification in Automated Labeling</title><p>Our main constructs rely on automated LLM-based labeling. Validation against human annotations indicates an accuracy of 82.5% for video stance (with almost all errors involving the neutral class rather than confusion between pro- and antivaccine positions) and &#x2248;73% exact agreement for comment agreement, rising to &#x2248;90% when &#x201C;neutral/unrelated&#x201D; is not counted as an error. These error rates imply that misclassification primarily attenuates differences by shifting items toward the neutral or mixed categories, rather than systematically flipping provaccine into vaccine-hesitant content or agreement into disagreement. Given that our core effects are large&#x2014;for example, vaccine-hesitant videos receive 10-fold higher raw interaction volume, 2.8- to 2.9-fold higher per-view engagement rates, and reach 90% of their engagement 20% faster even after controlling for engagement volume&#x2014;the directionality of our findings is robust to plausible levels of label noise. At the comment level, replacing up to 10%&#x2010;15% of labels with their opposite direction would reduce but not reverse the observed pattern. Vaccine-hesitant videos&#x2019; comment sections are dominated by agreement (eg, 40% agree vs 19% disagree), and provaccine videos attract higher disagreement (eg, 36% disagree vs 24% agree), so the classification uncertainty is more likely to bias our estimates toward conservative lower bounds than to generate spurious asymmetries.</p></sec></sec><sec id="s4-7"><title>Conclusions</title><p>This longitudinal study provides systematic evidence that vaccine-hesitant content on YouTube benefits from a distinct engagement advantage: it attracts approximately 10-fold higher raw interaction volume (and 2.8- to 2.9-fold higher per-view engagement rates) relative to provaccine content and reaches audience saturation significantly faster (44% faster in descriptive medians and 20% faster in adjusted regression estimates) than provaccine content. We identify a specific temporal signature&#x2014;an 18-day saturation window&#x2014;driven by audience structure. Vaccine-hesitant videos mobilize homogeneous, self-selected in-groups that generate rapid, confirmatory &#x201C;echo chambers,&#x201D; whereas provaccine content accumulates engagement incrementally through contentious &#x201C;battlegrounds&#x201D; of debate.</p><p>The policy implications of this mechanism are direct. Because the median time to moderation (14.4 days) lags behind the rapid saturation of hesitant narratives, reactive content removal is structurally ill-suited to mitigate misinformation. An effective public health strategy must therefore shift from post hoc rebuttal to proactive intervention. Prebunking campaigns and algorithmic ranking adjustments that elevate credible sources during the critical first 2 weeks of a video&#x2019;s lifecycle represent the most viable levers for competing with the rapid mobilization of hesitant communities.</p><p>While this study is limited to long-form English content and acknowledges the trade-offs inherent to scalable LLM classification, it establishes baseline temporal patterns essential for evidence-based policymaking. Future research must extend beyond single-platform dynamics to examine how recommendation algorithms specifically amplify these asymmetries and how content diffuses across platforms. Ultimately, navigating the complex digital health environment requires not just producing scientific knowledge, but understanding the precise temporal and structural mechanisms by which that knowledge competes for public attention.</p></sec></sec></body><back><ack><p>The authors declare the use of generative artificial intelligence (GAI) in the research and writing process. The authors used GPT-4o mini for zero-shot video and comment classification. Full responsibility for the content and integrity of the final manuscript rests entirely with the authors.</p></ack><notes><sec><title>Funding</title><p>YM acknowledges support from the Lagrange Project of the Institute for Scientific Interchange Foundation (ISI Foundation) funded by Fondazione Cassa di Risparmio di Torino (Fondazione CRT).</p></sec><sec><title>Data Availability</title><p>Data will be made available at OSF/Zenodo upon publication. Full transcripts and comments not released for privacy.</p></sec></notes><fn-group><fn fn-type="con"><p>MT contributed to conceptualization, formal analysis, methodology, visualization, writing of the original draft, investigation, and validation. YM contributed to conceptualization, data curation, visualization, writing of the original draft, investigation, and validation.</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">A</term><def><p>against vaccination stance</p></def></def-item><def-item><term id="abb2">API</term><def><p>application programming interface</p></def></def-item><def-item><term id="abb3">CHV</term><def><p>channel video counts</p></def></def-item><def-item><term id="abb4">CR</term><def><p>comment ratio</p></def></def-item><def-item><term id="abb5">CS</term><def><p>controversy score</p></def></def-item><def-item><term id="abb6">HC3</term><def><p>heteroskedasticity-consistent</p></def></def-item><def-item><term id="abb7">HDI</term><def><p>highest density interval</p></def></def-item><def-item><term id="abb8">IF</term><def><p>in favor of vaccination stance</p></def></def-item><def-item><term id="abb9">IRB</term><def><p>institutional review board</p></def></def-item><def-item><term id="abb10">IRR</term><def><p>incidence rate ratio</p></def></def-item><def-item><term id="abb11">LLM</term><def><p>large language model</p></def></def-item><def-item><term id="abb12">LR</term><def><p>like ratio</p></def></def-item><def-item><term id="abb13">N</term><def><p>neutral to vaccination stance</p></def></def-item><def-item><term id="abb14">OR</term><def><p>odds ratio</p></def></def-item><def-item><term id="abb15">SA</term><def><p>strongly against vaccination stance</p></def></def-item><def-item><term id="abb16">SIF</term><def><p>strongly in favor of vaccination stance</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Orenstein</surname><given-names>WA</given-names> </name><name name-style="western"><surname>Ahmed</surname><given-names>R</given-names> </name></person-group><article-title>Simply put: vaccination saves lives</article-title><source>Proc Natl Acad Sci USA</source><year>2017</year><month>04</month><day>18</day><volume>114</volume><issue>16</issue><fpage>4031</fpage><lpage>4033</lpage><pub-id pub-id-type="doi">10.1073/pnas.1704507114</pub-id><pub-id pub-id-type="medline">28396427</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Correia</surname><given-names>T</given-names> </name><name name-style="western"><surname>Hil&#x00E1;rio</surname><given-names>AP</given-names> </name><name name-style="western"><surname>Guerreiro</surname><given-names>C</given-names> </name><etal/></person-group><article-title>Policy recommendations for healthcare authorities, organizations and professionals on vaccine hesitancy in Europe: from evidence to practice</article-title><source>Health Policy</source><year>2025</year><month>08</month><volume>158</volume><fpage>105361</fpage><pub-id pub-id-type="doi">10.1016/j.healthpol.2025.105361</pub-id><pub-id pub-id-type="medline">40446640</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="web"><article-title>Global partners announce a new effort &#x2013; &#x201C;The Big Catch-Up&#x201D; &#x2013; to vaccinate millions of children and restore immunization progress lost during the pandemic</article-title><source>World Health Organization</source><year>2023</year><month>04</month><day>24</day><access-date>2026-05-26</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.who.int/news/item/24-04-2023-global-partners-announce-a-new-effort-the-big-catch-up-to-vaccinate-millions-of-children-and-restore-immunization-progress-lost-during-the-pandemic">https://www.who.int/news/item/24-04-2023-global-partners-announce-a-new-effort-the-big-catch-up-to-vaccinate-millions-of-children-and-restore-immunization-progress-lost-during-the-pandemic</ext-link></comment></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Paoletti</surname><given-names>G</given-names> </name><name name-style="western"><surname>Dall&#x2019;Amico</surname><given-names>L</given-names> </name><name name-style="western"><surname>Kalimeri</surname><given-names>K</given-names> </name><etal/></person-group><article-title>Political context of the European vaccine debate on Twitter</article-title><source>Sci Rep</source><year>2024</year><month>02</month><day>22</day><volume>14</volume><issue>1</issue><fpage>4397</fpage><pub-id pub-id-type="doi">10.1038/s41598-024-54863-7</pub-id><pub-id pub-id-type="medline">38388713</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Adeoye</surname><given-names>AF</given-names> </name><name name-style="western"><surname>Umoru</surname><given-names>DO</given-names> </name><name name-style="western"><surname>Gomez</surname><given-names>OO</given-names> </name><etal/></person-group><article-title>The 2025 United States Measles Crisis: when vaccine hesitancy meets reality</article-title><source>Cureus</source><year>2025</year><month>07</month><volume>17</volume><issue>7</issue><fpage>e88196</fpage><pub-id pub-id-type="doi">10.7759/cureus.88196</pub-id><pub-id pub-id-type="medline">40827145</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Allen</surname><given-names>J</given-names> </name><name name-style="western"><surname>Watts</surname><given-names>DJ</given-names> </name><name name-style="western"><surname>Rand</surname><given-names>DG</given-names> </name></person-group><article-title>Quantifying the impact of misinformation and vaccine-skeptical content on Facebook</article-title><source>Science</source><year>2024</year><month>05</month><day>31</day><volume>384</volume><issue>6699</issue><fpage>eadk3451</fpage><pub-id pub-id-type="doi">10.1126/science.adk3451</pub-id><pub-id pub-id-type="medline">38815040</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wilson</surname><given-names>SL</given-names> </name><name name-style="western"><surname>Wiysonge</surname><given-names>C</given-names> </name></person-group><article-title>Social media and vaccine hesitancy</article-title><source>BMJ Glob Health</source><year>2020</year><month>10</month><volume>5</volume><issue>10</issue><fpage>e004206</fpage><pub-id pub-id-type="doi">10.1136/bmjgh-2020-004206</pub-id><pub-id pub-id-type="medline">33097547</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Faverio</surname><given-names>M</given-names> </name><name name-style="western"><surname>Sidoti</surname><given-names>O</given-names> </name></person-group><article-title>Teens, social media and technology 2024</article-title><source>Pew Research Center</source><year>2024</year><month>12</month><day>12</day><access-date>2026-05-22</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.pewresearch.org/internet/2024/12/12/teens-social-media-and-technology-2024">https://www.pewresearch.org/internet/2024/12/12/teens-social-media-and-technology-2024</ext-link></comment></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Gottfried</surname><given-names>J</given-names> </name><name name-style="western"><surname>Park</surname><given-names>E</given-names> </name></person-group><article-title>Americans&#x2019; social media use 2025</article-title><source>Pew Research Center</source><year>2025</year><month>11</month><day>20</day><access-date>2026-05-22</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.pewresearch.org/internet/2025/11/20/americans-social-media-use-2025">https://www.pewresearch.org/internet/2025/11/20/americans-social-media-use-2025</ext-link></comment></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Basch</surname><given-names>C</given-names> </name><name name-style="western"><surname>Zybert</surname><given-names>P</given-names> </name><name name-style="western"><surname>Reeves</surname><given-names>R</given-names> </name><name name-style="western"><surname>Basch</surname><given-names>C</given-names> </name></person-group><article-title>What do popular YouTube videos say about vaccines?</article-title><source>Child Care Health Dev</source><year>2017</year><volume>43</volume><issue>4</issue><fpage>499</fpage><lpage>503</lpage><pub-id pub-id-type="doi">10.1111/cch.12442</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tang</surname><given-names>L</given-names> </name><name name-style="western"><surname>Fujimoto</surname><given-names>K</given-names> </name><name name-style="western"><surname>Amith</surname><given-names>MT</given-names> </name><etal/></person-group><article-title>&#x201C;Down the rabbit hole&#x201D; of vaccine misinformation on YouTube: network exposure study</article-title><source>J Med Internet Res</source><year>2021</year><month>01</month><day>5</day><volume>23</volume><issue>1</issue><fpage>e23262</fpage><pub-id pub-id-type="doi">10.2196/23262</pub-id><pub-id pub-id-type="medline">33399543</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ng</surname><given-names>YMM</given-names> </name><name name-style="western"><surname>Hoffmann Pham</surname><given-names>K</given-names> </name><name name-style="western"><surname>Luengo-Oroz</surname><given-names>M</given-names> </name></person-group><article-title>Exploring YouTube&#x2019;s recommendation system in the context of COVID-19 vaccines: computational and comparative analysis of video trajectories</article-title><source>J Med Internet Res</source><year>2023</year><month>09</month><day>15</day><volume>25</volume><fpage>e49061</fpage><pub-id pub-id-type="doi">10.2196/49061</pub-id><pub-id pub-id-type="medline">37713243</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jung</surname><given-names>H</given-names> </name><name name-style="western"><surname>Juneja</surname><given-names>P</given-names> </name><name name-style="western"><surname>Mitra</surname><given-names>T</given-names> </name></person-group><article-title>Algorithmic behaviors across regions: a geolocation audit of YouTube search for COVID-19 misinformation between the United States and South Africa</article-title><source>Proc Int AAAI Conf Web Soc Media</source><year>2025</year><month>06</month><volume>19</volume><issue>1</issue><fpage>935</fpage><lpage>964</lpage><pub-id pub-id-type="doi">10.1609/icwsm.v19i1.35854</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chan</surname><given-names>C</given-names> </name><name name-style="western"><surname>Sounderajah</surname><given-names>V</given-names> </name><name name-style="western"><surname>Daniels</surname><given-names>E</given-names> </name><etal/></person-group><article-title>The reliability and quality of YouTube videos as a source of public health information regarding COVID-19 vaccination: cross-sectional study</article-title><source>JMIR Public Health Surveill</source><year>2021</year><volume>7</volume><issue>7</issue><fpage>e29942</fpage><pub-id pub-id-type="doi">10.2196/29942</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Vosoughi</surname><given-names>S</given-names> </name><name name-style="western"><surname>Roy</surname><given-names>D</given-names> </name><name name-style="western"><surname>Aral</surname><given-names>S</given-names> </name></person-group><article-title>The spread of true and false news online</article-title><source>Science</source><year>2018</year><month>03</month><day>9</day><volume>359</volume><issue>6380</issue><fpage>1146</fpage><lpage>1151</lpage><pub-id pub-id-type="doi">10.1126/science.aap9559</pub-id><pub-id pub-id-type="medline">29590045</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="web"><article-title>Medical misinformation policy</article-title><source>YouTube</source><access-date>2026-05-26</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://support.google.com/youtube/answer/13813322?hl=en">https://support.google.com/youtube/answer/13813322?hl=en</ext-link></comment></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Graham</surname><given-names>G</given-names> </name><name name-style="western"><surname>Halprin</surname><given-names>M</given-names> </name></person-group><article-title>A long-term vision for YouTube&#x2019;s medical misinformation policies</article-title><source>YouTube</source><year>2023</year><month>08</month><day>15</day><access-date>2026-05-26</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://blog.youtube/inside-youtube/a-long-term-vision-for-medical-misinformation-policies/?sjid=13964636406615525454-EU">https://blog.youtube/inside-youtube/a-long-term-vision-for-medical-misinformation-policies/?sjid=13964636406615525454-EU</ext-link></comment></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cinelli</surname><given-names>M</given-names> </name><name name-style="western"><surname>De Francisci Morales</surname><given-names>G</given-names> </name><name name-style="western"><surname>Galeazzi</surname><given-names>A</given-names> </name><name name-style="western"><surname>Quattrociocchi</surname><given-names>W</given-names> </name><name name-style="western"><surname>Starnini</surname><given-names>M</given-names> </name></person-group><article-title>The echo chamber effect on social media</article-title><source>Proc Natl Acad Sci U S A</source><year>2021</year><month>03</month><day>2</day><volume>118</volume><issue>9</issue><fpage>e2023301118</fpage><pub-id pub-id-type="doi">10.1073/pnas.2023301118</pub-id><pub-id pub-id-type="medline">33622786</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Crupi</surname><given-names>G</given-names> </name><name name-style="western"><surname>Mejova</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Tizzani</surname><given-names>M</given-names> </name><name name-style="western"><surname>Paolotti</surname><given-names>D</given-names> </name><name name-style="western"><surname>Panisson</surname><given-names>A</given-names> </name></person-group><article-title>Echoes through time: evolution of the Italian COVID-19 vaccination debate</article-title><source>Proc Int AAAI Conf Web Soc Media</source><year>2022</year><month>05</month><volume>16</volume><fpage>102</fpage><lpage>113</lpage><pub-id pub-id-type="doi">10.1609/icwsm.v16i1.19276</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gruzd</surname><given-names>A</given-names> </name><name name-style="western"><surname>Abul-Fottouh</surname><given-names>D</given-names> </name><name name-style="western"><surname>Song</surname><given-names>MY</given-names> </name><name name-style="western"><surname>Saiphoo</surname><given-names>A</given-names> </name></person-group><article-title>From Facebook to YouTube: the potential exposure to COVID-19 anti-vaccine videos on social media</article-title><source>Soc Media Soc</source><year>2023</year><volume>9</volume><issue>1</issue><fpage>20563051221150403</fpage><pub-id pub-id-type="doi">10.1177/20563051221150403</pub-id><pub-id pub-id-type="medline">36751363</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Garrett</surname><given-names>RK</given-names> </name></person-group><article-title>Echo chambers online? Politically motivated selective exposure among internet news users</article-title><source>J Comput-Mediat Commun</source><year>2009</year><month>01</month><volume>14</volume><issue>2</issue><fpage>265</fpage><lpage>285</lpage><pub-id pub-id-type="doi">10.1111/j.1083-6101.2009.01440.x</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ekram</surname><given-names>S</given-names> </name><name name-style="western"><surname>Debiec</surname><given-names>KE</given-names> </name><name name-style="western"><surname>Pumper</surname><given-names>MA</given-names> </name><name name-style="western"><surname>Moreno</surname><given-names>MA</given-names> </name></person-group><article-title>Content and commentary: HPV vaccine and YouTube</article-title><source>J Pediatr Adolesc Gynecol</source><year>2019</year><month>04</month><volume>32</volume><issue>2</issue><fpage>153</fpage><lpage>157</lpage><pub-id pub-id-type="doi">10.1016/j.jpag.2018.11.001</pub-id><pub-id pub-id-type="medline">30445163</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Garimella</surname><given-names>K</given-names> </name><name name-style="western"><surname>Morales</surname><given-names>GDF</given-names> </name><name name-style="western"><surname>Gionis</surname><given-names>A</given-names> </name><name name-style="western"><surname>Mathioudakis</surname><given-names>M</given-names> </name></person-group><article-title>Quantifying controversy on social media</article-title><source>ACM Trans Social Comput</source><year>2018</year><month>03</month><day>31</day><volume>1</volume><issue>1</issue><fpage>1</fpage><lpage>27</lpage><pub-id pub-id-type="doi">10.1145/3140565</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ka&#x0148;kov&#x00E1;</surname><given-names>J</given-names> </name><name name-style="western"><surname>Binder</surname><given-names>A</given-names> </name><name name-style="western"><surname>Matthes</surname><given-names>J</given-names> </name></person-group><article-title>Health-related communication of social media influencers: a scoping review</article-title><source>Health Commun</source><year>2025</year><month>06</month><volume>40</volume><issue>7</issue><fpage>1300</fpage><lpage>1313</lpage><pub-id pub-id-type="doi">10.1080/10410236.2024.2397268</pub-id><pub-id pub-id-type="medline">39258728</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Mejova</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Kalimeri</surname><given-names>K</given-names> </name></person-group><article-title>COVID-19 on Facebook ads: competing agendas around a public health crisis</article-title><source>Proceedings of the 3rd ACM SIGCAS Conference on Computing and Sustainable Societies</source><year>2020</year><publisher-name>Association for Computing Machinery</publisher-name><fpage>22</fpage><lpage>31</lpage><pub-id pub-id-type="doi">10.1145/3378393.3402241</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Carrieri</surname><given-names>V</given-names> </name><name name-style="western"><surname>Guthmuller</surname><given-names>S</given-names> </name><name name-style="western"><surname>W&#x00FC;bker</surname><given-names>A</given-names> </name></person-group><article-title>Trust and COVID-19 vaccine hesitancy</article-title><source>Sci Rep</source><year>2023</year><month>06</month><day>7</day><volume>13</volume><issue>1</issue><fpage>9245</fpage><pub-id pub-id-type="doi">10.1038/s41598-023-35974-z</pub-id><pub-id pub-id-type="medline">37286569</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rodrigues</surname><given-names>F</given-names> </name><name name-style="western"><surname>Ziade</surname><given-names>N</given-names> </name><name name-style="western"><surname>Jatuworapruk</surname><given-names>K</given-names> </name><name name-style="western"><surname>Caballero-Uribe</surname><given-names>CV</given-names> </name><name name-style="western"><surname>Khursheed</surname><given-names>T</given-names> </name><name name-style="western"><surname>Gupta</surname><given-names>L</given-names> </name></person-group><article-title>The impact of social media on vaccination: a narrative review</article-title><source>J Korean Med Sci</source><year>2023</year><month>10</month><day>16</day><volume>38</volume><issue>40</issue><fpage>e326</fpage><pub-id pub-id-type="doi">10.3346/jkms.2023.38.e326</pub-id><pub-id pub-id-type="medline">37846789</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Major</surname><given-names>D</given-names> </name></person-group><article-title>COVID-19 misinformation cost at least 2,800 lives and $300M, new report says</article-title><source>CBC News</source><year>2023</year><month>01</month><day>26</day><access-date>2026-05-26</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.cbc.ca/news/politics/cost-of-covid-19-misinformation-study-1.6726356">https://www.cbc.ca/news/politics/cost-of-covid-19-misinformation-study-1.6726356</ext-link></comment></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Mitropoulos</surname><given-names>A</given-names> </name></person-group><article-title>300,000 US COVID deaths could have been averted through vaccination, analysis finds</article-title><source>ABC News</source><year>2022</year><month>05</month><day>16</day><access-date>2026-05-26</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://abcnews.com/Health/300000-us-covid-deaths-averted-vaccination-analysis-finds/story?id=84753284">https://abcnews.com/Health/300000-us-covid-deaths-averted-vaccination-analysis-finds/story?id=84753284</ext-link></comment></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="web"><article-title>Data API &#x003E; Search: list</article-title><source>YouTube</source><access-date>2026-05-26</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://developers.google.com/youtube/v3/docs/search/list">https://developers.google.com/youtube/v3/docs/search/list</ext-link></comment></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Betti</surname><given-names>L</given-names> </name><name name-style="western"><surname>De Francisci Morales</surname><given-names>G</given-names> </name><name name-style="western"><surname>Gauvin</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Detecting adherence to the recommended childhood vaccination schedule from user-generated content in a US parenting forum</article-title><source>PLoS Comput Biol</source><year>2021</year><month>04</month><volume>17</volume><issue>4</issue><fpage>e1008919</fpage><pub-id pub-id-type="doi">10.1371/journal.pcbi.1008919</pub-id><pub-id pub-id-type="medline">33901170</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lenti</surname><given-names>J</given-names> </name><name name-style="western"><surname>Mejova</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Kalimeri</surname><given-names>K</given-names> </name><etal/></person-group><article-title>Global misinformation spillovers in the vaccination debate before and during the COVID-19 pandemic: multilingual Twitter study</article-title><source>JMIR Infodemiol</source><year>2023</year><month>05</month><day>24</day><volume>3</volume><fpage>e44714</fpage><pub-id pub-id-type="doi">10.2196/44714</pub-id><pub-id pub-id-type="medline">37223965</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="web"><article-title>Data API &#x003E; videos</article-title><source>YouTube</source><access-date>2026-05-26</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://developers.google.com/youtube/v3/docs/videos">https://developers.google.com/youtube/v3/docs/videos</ext-link></comment></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="web"><article-title>Transcript API</article-title><source>YouTube</source><access-date>2026-05-26</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://pypi.org/project/youtube-transcript-api">https://pypi.org/project/youtube-transcript-api</ext-link></comment></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="web"><article-title>Data API &#x003E; Channels: list</article-title><source>YouTube</source><access-date>2026-05-26</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://developers.google.com/youtube/v3/docs/channels/list">https://developers.google.com/youtube/v3/docs/channels/list</ext-link></comment></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>MacDonald</surname><given-names>NE</given-names> </name><collab>SAGE Working Group on Vaccine Hesitancy</collab></person-group><article-title>Vaccine hesitancy: definition, scope and determinants</article-title><source>Vaccine (Auckl)</source><year>2015</year><month>08</month><day>14</day><volume>33</volume><issue>34</issue><fpage>4161</fpage><lpage>4164</lpage><pub-id pub-id-type="doi">10.1016/j.vaccine.2015.04.036</pub-id><pub-id pub-id-type="medline">25896383</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Huang</surname><given-names>LC</given-names> </name><name name-style="western"><surname>Eiden</surname><given-names>AL</given-names> </name><name name-style="western"><surname>He</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Natural language processing&#x2013;powered real-time monitoring solution for vaccine sentiments and hesitancy on social media: system development and validation</article-title><source>JMIR Med Inform</source><year>2024</year><month>06</month><day>21</day><volume>12</volume><issue>1</issue><fpage>e57164</fpage><pub-id pub-id-type="doi">10.2196/57164</pub-id><pub-id pub-id-type="medline">38904984</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Landis</surname><given-names>JR</given-names> </name><name name-style="western"><surname>Koch</surname><given-names>GG</given-names> </name></person-group><article-title>The measurement of observer agreement for categorical data</article-title><source>Biometrics</source><year>1977</year><month>03</month><volume>33</volume><issue>1</issue><fpage>159</fpage><lpage>174</lpage><pub-id pub-id-type="doi">10.2307/2529310</pub-id><pub-id pub-id-type="medline">843571</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Liang</surname><given-names>W</given-names> </name><name name-style="western"><surname>Luo</surname><given-names>W</given-names> </name><etal/></person-group><article-title>Recent advances in hierarchical multi-label text classification: a survey</article-title><source>arXiv</source><comment>Preprint posted online on  Jul 30, 2023</comment><pub-id pub-id-type="doi">10.48550/arXiv.2307.16265</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Rojas</surname><given-names>KR</given-names> </name><name name-style="western"><surname>Bustamante</surname><given-names>G</given-names> </name><name name-style="western"><surname>Oncevay</surname><given-names>A</given-names> </name><name name-style="western"><surname>Cabezudo</surname><given-names>MAS</given-names> </name></person-group><person-group person-group-type="editor"><name name-style="western"><surname>Tetreault</surname><given-names>J</given-names> </name><name name-style="western"><surname>Chai</surname><given-names>J</given-names> </name><name name-style="western"><surname>Schluter</surname><given-names>N</given-names> </name><name name-style="western"><surname>Tetreault</surname><given-names>J</given-names> </name></person-group><article-title>Efficient strategies for hierarchical text classification: external knowledge and auxiliary tasks</article-title><source>Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics</source><year>2020</year><publisher-name>Association for Computational Linguistics</publisher-name><pub-id pub-id-type="doi">10.18653/v1/2020.acl-main.205</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Viola</surname><given-names>P</given-names> </name><name name-style="western"><surname>Jones</surname><given-names>M</given-names> </name></person-group><article-title>Robust real-time face detection</article-title><source>Int J Comput Vis</source><year>2004</year><volume>57</volume><issue>2</issue><fpage>137</fpage><lpage>154</lpage><pub-id pub-id-type="doi">10.1109/iccv.2001.937709</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Hearst</surname><given-names>MA</given-names> </name></person-group><article-title>Automatic acquisition of hyponyms from large text corpora</article-title><source>Proceedings of the 14th International Conference on Computational Linguistics</source><year>1992</year><publisher-name>Association for Computational Linguistics</publisher-name><fpage>539</fpage><lpage>545</lpage><pub-id pub-id-type="doi">10.3115/992133.992154</pub-id></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Bykau</surname><given-names>S</given-names> </name><name name-style="western"><surname>Korn</surname><given-names>F</given-names> </name><name name-style="western"><surname>Srivastava</surname><given-names>D</given-names> </name><name name-style="western"><surname>Velegrakis</surname><given-names>Y</given-names> </name></person-group><article-title>Fine-grained controversy detection in Wikipedia</article-title><source>2015 IEEE 31st International Conference on Data Engineering (ICDE)</source><year>2015</year><publisher-name>IEEE</publisher-name><fpage>1573</fpage><lpage>1584</lpage><pub-id pub-id-type="doi">10.1109/ICDE.2015.7113426</pub-id></nlm-citation></ref><ref id="ref44"><label>44</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Donzelli</surname><given-names>G</given-names> </name><name name-style="western"><surname>Palomba</surname><given-names>G</given-names> </name><name name-style="western"><surname>Federigi</surname><given-names>I</given-names> </name><etal/></person-group><article-title>Misinformation on vaccination: a quantitative analysis of YouTube videos</article-title><source>Hum Vaccin Immunother</source><year>2018</year><month>07</month><day>3</day><volume>14</volume><issue>7</issue><fpage>1654</fpage><lpage>1659</lpage><pub-id pub-id-type="doi">10.1080/21645515.2018.1454572</pub-id><pub-id pub-id-type="medline">29553872</pub-id></nlm-citation></ref><ref id="ref45"><label>45</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>T&#x00F6;rnberg</surname><given-names>P</given-names> </name><name name-style="western"><surname>T&#x00F6;rnberg</surname><given-names>A</given-names> </name></person-group><article-title>Inside a white power echo chamber: why fringe digital spaces are polarizing politics</article-title><source>New Media Society</source><year>2024</year><month>08</month><volume>26</volume><issue>8</issue><fpage>4511</fpage><lpage>4533</lpage><pub-id pub-id-type="doi">10.1177/14614448221122915</pub-id></nlm-citation></ref><ref id="ref46"><label>46</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Freeman</surname><given-names>D</given-names> </name><name name-style="western"><surname>Loe</surname><given-names>BS</given-names> </name><name name-style="western"><surname>Chadwick</surname><given-names>A</given-names> </name><etal/></person-group><article-title>COVID-19 vaccine hesitancy in the UK: the Oxford coronavirus explanations, attitudes, and narratives survey (Oceans) II</article-title><source>Psychol Med</source><year>2022</year><month>10</month><volume>52</volume><issue>14</issue><fpage>3127</fpage><lpage>3141</lpage><pub-id pub-id-type="doi">10.1017/S0033291720005188</pub-id><pub-id pub-id-type="medline">33305716</pub-id></nlm-citation></ref><ref id="ref47"><label>47</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lorenz-Spreen</surname><given-names>P</given-names> </name><name name-style="western"><surname>Oswald</surname><given-names>L</given-names> </name><name name-style="western"><surname>Lewandowsky</surname><given-names>S</given-names> </name><name name-style="western"><surname>Hertwig</surname><given-names>R</given-names> </name></person-group><article-title>A systematic review of worldwide causal and correlational evidence on digital media and democracy</article-title><source>Nat Hum Behav</source><year>2023</year><month>01</month><volume>7</volume><issue>1</issue><fpage>74</fpage><lpage>101</lpage><pub-id pub-id-type="doi">10.1038/s41562-022-01460-1</pub-id><pub-id pub-id-type="medline">36344657</pub-id></nlm-citation></ref><ref id="ref48"><label>48</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Geschke</surname><given-names>D</given-names> </name><name name-style="western"><surname>Lorenz</surname><given-names>J</given-names> </name><name name-style="western"><surname>Holtz</surname><given-names>P</given-names> </name></person-group><article-title>The triple-filter bubble: using agent-based modelling to test a meta-theoretical framework for the emergence of filter bubbles and echo chambers</article-title><source>Br J Soc Psychol</source><year>2019</year><month>01</month><volume>58</volume><issue>1</issue><fpage>129</fpage><lpage>149</lpage><pub-id pub-id-type="doi">10.1111/bjso.12286</pub-id><pub-id pub-id-type="medline">30311947</pub-id></nlm-citation></ref><ref id="ref49"><label>49</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lewandowsky</surname><given-names>S</given-names> </name><name name-style="western"><surname>van der Linden</surname><given-names>S</given-names> </name></person-group><article-title>Countering misinformation and fake news through inoculation and prebunking</article-title><source>Eur Rev Soc Psychol</source><year>2021</year><month>07</month><volume>32</volume><issue>2</issue><fpage>348</fpage><lpage>384</lpage><pub-id pub-id-type="doi">10.1080/10463283.2021.1876983</pub-id></nlm-citation></ref><ref id="ref50"><label>50</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Schneider</surname><given-names>PJ</given-names> </name><name name-style="western"><surname>Rizoiu</surname><given-names>MA</given-names> </name></person-group><article-title>The effectiveness of moderating harmful online content</article-title><source>Proc Natl Acad Sci USA</source><year>2023</year><month>08</month><volume>120</volume><issue>34</issue><fpage>e2307360120</fpage><pub-id pub-id-type="doi">10.1073/pnas.2307360120</pub-id></nlm-citation></ref><ref id="ref51"><label>51</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Truong</surname><given-names>BT</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>S</given-names> </name><name name-style="western"><surname>Nogara</surname><given-names>G</given-names> </name><etal/></person-group><article-title>Delayed takedown of illegal content on social media makes moderation ineffective</article-title><source>arXiv</source><access-date>2026-06-11</access-date><comment>Preprint posted online on  Aug 9, 2025</comment><comment><ext-link ext-link-type="uri" xlink:href="https://arxiv.org/html/2502.08841v2">https://arxiv.org/html/2502.08841v2</ext-link></comment></nlm-citation></ref><ref id="ref52"><label>52</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Basol</surname><given-names>M</given-names> </name><name name-style="western"><surname>Roozenbeek</surname><given-names>J</given-names> </name><name name-style="western"><surname>van der Linden</surname><given-names>S</given-names> </name></person-group><article-title>Good news about bad news: gamified inoculation boosts confidence and cognitive immunity against fake news</article-title><source>J Cogn</source><year>2020</year><month>01</month><day>10</day><volume>3</volume><issue>1</issue><fpage>2</fpage><pub-id pub-id-type="doi">10.5334/joc.91</pub-id><pub-id pub-id-type="medline">31934684</pub-id></nlm-citation></ref><ref id="ref53"><label>53</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Roozenbeek</surname><given-names>J</given-names> </name><name name-style="western"><surname>van der Linden</surname><given-names>S</given-names> </name></person-group><article-title>Breaking Harmony Square: a game that &#x201C;inoculates&#x201D; against political misinformation</article-title><source>Harv Kennedy Sch Misinform Rev</source><year>2020</year><month>11</month><day>6</day><volume>1</volume><issue>8</issue><pub-id pub-id-type="doi">10.37016/mr-2020-47</pub-id></nlm-citation></ref><ref id="ref54"><label>54</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Roozenbeek</surname><given-names>J</given-names> </name><name name-style="western"><surname>van der Linden</surname><given-names>S</given-names> </name><name name-style="western"><surname>Goldberg</surname><given-names>B</given-names> </name><name name-style="western"><surname>Rathje</surname><given-names>S</given-names> </name><name name-style="western"><surname>Lewandowsky</surname><given-names>S</given-names> </name></person-group><article-title>Psychological inoculation improves resilience against misinformation on social media</article-title><source>Sci Adv</source><year>2022</year><month>08</month><day>26</day><volume>8</volume><issue>34</issue><fpage>eabo6254</fpage><pub-id pub-id-type="doi">10.1126/sciadv.abo6254</pub-id><pub-id pub-id-type="medline">36001675</pub-id></nlm-citation></ref><ref id="ref55"><label>55</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pierri</surname><given-names>F</given-names> </name><name name-style="western"><surname>DeVerna</surname><given-names>MR</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>KC</given-names> </name><name name-style="western"><surname>Axelrod</surname><given-names>D</given-names> </name><name name-style="western"><surname>Bryden</surname><given-names>J</given-names> </name><name name-style="western"><surname>Menczer</surname><given-names>F</given-names> </name></person-group><article-title>One year of COVID-19 vaccine misinformation on Twitter: longitudinal study</article-title><source>J Med Internet Res</source><year>2023</year><month>02</month><day>24</day><volume>25</volume><fpage>e42227</fpage><pub-id pub-id-type="doi">10.2196/42227</pub-id><pub-id pub-id-type="medline">36735835</pub-id></nlm-citation></ref><ref id="ref56"><label>56</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mena</surname><given-names>P</given-names> </name></person-group><article-title>Cleaning up social media: the effect of warning labels on likelihood of sharing false news on Facebook</article-title><source>Policy Internet</source><year>2020</year><month>06</month><volume>12</volume><issue>2</issue><fpage>165</fpage><lpage>183</lpage><comment><ext-link ext-link-type="uri" xlink:href="https://onlinelibrary.wiley.com/toc/19442866/12/2">https://onlinelibrary.wiley.com/toc/19442866/12/2</ext-link></comment><pub-id pub-id-type="doi">10.1002/poi3.214</pub-id></nlm-citation></ref><ref id="ref57"><label>57</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pennycook</surname><given-names>G</given-names> </name><name name-style="western"><surname>Epstein</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Mosleh</surname><given-names>M</given-names> </name><name name-style="western"><surname>Arechar</surname><given-names>AA</given-names> </name><name name-style="western"><surname>Eckles</surname><given-names>D</given-names> </name><name name-style="western"><surname>Rand</surname><given-names>DG</given-names> </name></person-group><article-title>Shifting attention to accuracy can reduce misinformation online</article-title><source>Nature New Biol</source><year>2021</year><month>04</month><volume>592</volume><issue>7855</issue><fpage>590</fpage><lpage>595</lpage><pub-id pub-id-type="doi">10.1038/s41586-021-03344-2</pub-id><pub-id pub-id-type="medline">33731933</pub-id></nlm-citation></ref><ref id="ref58"><label>58</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Goldman</surname><given-names>E</given-names> </name></person-group><article-title>Content moderation remedies</article-title><source>Mich Techn Law Rev</source><year>2021</year><volume>28</volume><pub-id pub-id-type="doi">10.36645/mtlr.28.1.content</pub-id></nlm-citation></ref><ref id="ref59"><label>59</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Suzor</surname><given-names>N</given-names> </name><name name-style="western"><surname>Van Geelen</surname><given-names>T</given-names> </name><name name-style="western"><surname>Myers West</surname><given-names>S</given-names> </name></person-group><article-title>Evaluating the legitimacy of platform governance: a review of research and a shared research agenda</article-title><source>Int Commun Gaz</source><year>2018</year><month>06</month><volume>80</volume><issue>4</issue><fpage>385</fpage><lpage>400</lpage><pub-id pub-id-type="doi">10.1177/1748048518757142</pub-id></nlm-citation></ref><ref id="ref60"><label>60</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bhargava</surname><given-names>VR</given-names> </name><name name-style="western"><surname>Velasquez</surname><given-names>M</given-names> </name></person-group><article-title>Ethics of the attention economy: the problem of social media addiction</article-title><source>Bus Ethics Q</source><year>2021</year><month>07</month><volume>31</volume><issue>3</issue><fpage>321</fpage><lpage>359</lpage><pub-id pub-id-type="doi">10.1017/beq.2020.32</pub-id></nlm-citation></ref><ref id="ref61"><label>61</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Starbird</surname><given-names>K</given-names> </name><name name-style="western"><surname>Arif</surname><given-names>A</given-names> </name><name name-style="western"><surname>Wilson</surname><given-names>T</given-names> </name></person-group><article-title>Disinformation as collaborative work: surfacing the participatory nature of strategic information operations</article-title><source>Proc ACM Hum-Comput Interact</source><year>2019</year><volume>3</volume><fpage>1</fpage><lpage>26</lpage><pub-id pub-id-type="doi">10.1145/3359229</pub-id></nlm-citation></ref><ref id="ref62"><label>62</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gollust</surname><given-names>SE</given-names> </name><name name-style="western"><surname>Lantz</surname><given-names>PM</given-names> </name><name name-style="western"><surname>Ubel</surname><given-names>PA</given-names> </name></person-group><article-title>The polarizing effect of news media messages about the social determinants of health</article-title><source>Am J Public Health</source><year>2009</year><month>12</month><volume>99</volume><issue>12</issue><fpage>2160</fpage><lpage>2167</lpage><pub-id pub-id-type="doi">10.2105/AJPH.2009.161414</pub-id><pub-id pub-id-type="medline">19833981</pub-id></nlm-citation></ref><ref id="ref63"><label>63</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Niederdeppe</surname><given-names>J</given-names> </name><name name-style="western"><surname>Shapiro</surname><given-names>MA</given-names> </name><name name-style="western"><surname>Porticella</surname><given-names>N</given-names> </name></person-group><article-title>Attributions of responsibility for obesity: narrative communication reduces reactive counterarguing among liberals</article-title><source>Hum Commun Res</source><year>2011</year><month>07</month><volume>37</volume><issue>3</issue><fpage>295</fpage><lpage>323</lpage><pub-id pub-id-type="doi">10.1111/j.1468-2958.2011.01409.x</pub-id></nlm-citation></ref><ref id="ref64"><label>64</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Barrera</surname><given-names>O</given-names> </name><name name-style="western"><surname>Guriev</surname><given-names>S</given-names> </name><name name-style="western"><surname>Henry</surname><given-names>E</given-names> </name><name name-style="western"><surname>Zhuravskaya</surname><given-names>E</given-names> </name></person-group><article-title>Facts, alternative facts, and fact checking in times of post-truth politics</article-title><source>J Public Econ</source><year>2020</year><month>02</month><volume>182</volume><fpage>104123</fpage><pub-id pub-id-type="doi">10.1016/j.jpubeco.2019.104123</pub-id></nlm-citation></ref><ref id="ref65"><label>65</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>X</given-names> </name><name name-style="western"><surname>Sin</surname><given-names>SCJ</given-names> </name><name name-style="western"><surname>Theng</surname><given-names>YL</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>CS</given-names> </name></person-group><article-title>Why students share misinformation on social media: motivation, gender, and study-level differences</article-title><source>J Acad Librarianship</source><year>2015</year><month>09</month><volume>41</volume><issue>5</issue><fpage>583</fpage><lpage>592</lpage><pub-id pub-id-type="doi">10.1016/j.acalib.2015.07.003</pub-id></nlm-citation></ref><ref id="ref66"><label>66</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nagler</surname><given-names>RH</given-names> </name><name name-style="western"><surname>Vogel</surname><given-names>RI</given-names> </name><name name-style="western"><surname>Gollust</surname><given-names>SE</given-names> </name><name name-style="western"><surname>Rothman</surname><given-names>AJ</given-names> </name><name name-style="western"><surname>Fowler</surname><given-names>EF</given-names> </name><name name-style="western"><surname>Yzer</surname><given-names>MC</given-names> </name></person-group><article-title>Public perceptions of conflicting information surrounding COVID-19: results from a nationally representative survey of U.S. adults</article-title><source>PLoS One</source><year>2020</year><volume>15</volume><issue>10</issue><fpage>e0240776</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0240776</pub-id><pub-id pub-id-type="medline">33085719</pub-id></nlm-citation></ref><ref id="ref67"><label>67</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chandio</surname><given-names>S</given-names> </name><name name-style="western"><surname>Pirwani Dar</surname><given-names>MD</given-names> </name><name name-style="western"><surname>Nithyanand</surname><given-names>R</given-names> </name></person-group><article-title>How audit methods impact our understanding of YouTube&#x2019;s recommendation systems</article-title><source>Proc Int AAAI Conf Weblogs Soc Media</source><year>2024</year><volume>18</volume><fpage>241</fpage><lpage>253</lpage><pub-id pub-id-type="doi">10.1609/icwsm.v18i1.31311</pub-id></nlm-citation></ref><ref id="ref68"><label>68</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>P</given-names> </name><name name-style="western"><surname>Piao</surname><given-names>J</given-names> </name><name name-style="western"><surname>Xu</surname><given-names>F</given-names> </name><name name-style="western"><surname>Li</surname><given-names>Y</given-names> </name></person-group><article-title>Shorter is different: characterizing the dynamics of short-form video platforms</article-title><source>arXiv</source><comment>Preprint posted online on  Oct 21, 2024</comment><pub-id pub-id-type="doi">10.48550/arXiv.2410.16058</pub-id></nlm-citation></ref><ref id="ref69"><label>69</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Violot</surname><given-names>C</given-names> </name><name name-style="western"><surname>Elmas</surname><given-names>T</given-names> </name><name name-style="western"><surname>Bilogrevic</surname><given-names>I</given-names> </name><name name-style="western"><surname>Humbert</surname><given-names>M</given-names> </name></person-group><article-title>Shorts vs. regular videos on YouTube: a comparative analysis of user engagement and content creation trends</article-title><source>WEBSCI &#x2019;24: Proceedings of the 16th ACM Web Science Conference</source><year>2024</year><publisher-name>Association for Computing Machinery</publisher-name><fpage>213</fpage><lpage>223</lpage><pub-id pub-id-type="doi">10.1145/3614419.3644023</pub-id></nlm-citation></ref><ref id="ref70"><label>70</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lasco</surname><given-names>G</given-names> </name><name name-style="western"><surname>Curato</surname><given-names>N</given-names> </name></person-group><article-title>Medical populism</article-title><source>Soc Sci Med</source><year>2019</year><month>01</month><volume>221</volume><fpage>1</fpage><lpage>8</lpage><pub-id pub-id-type="doi">10.1016/j.socscimed.2018.12.006</pub-id><pub-id pub-id-type="medline">30553118</pub-id></nlm-citation></ref><ref id="ref71"><label>71</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Larson</surname><given-names>HJ</given-names> </name><name name-style="western"><surname>de Figueiredo</surname><given-names>A</given-names> </name><name name-style="western"><surname>Xiahong</surname><given-names>Z</given-names> </name><etal/></person-group><article-title>The state of vaccine confidence 2016: global insights through a 67-country survey</article-title><source>EBioMedicine</source><year>2016</year><month>10</month><volume>12</volume><fpage>295</fpage><lpage>301</lpage><pub-id pub-id-type="doi">10.1016/j.ebiom.2016.08.042</pub-id><pub-id pub-id-type="medline">27658738</pub-id></nlm-citation></ref><ref id="ref72"><label>72</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dubovi</surname><given-names>I</given-names> </name><name name-style="western"><surname>Tabak</surname><given-names>I</given-names> </name></person-group><article-title>An empirical analysis of knowledge co-construction in YouTube comments</article-title><source>Comput Educ</source><year>2020</year><month>10</month><volume>156</volume><fpage>103939</fpage><pub-id pub-id-type="doi">10.1016/j.compedu.2020.103939</pub-id></nlm-citation></ref><ref id="ref73"><label>73</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Miyazaki</surname><given-names>K</given-names> </name><name name-style="western"><surname>Uchiba</surname><given-names>T</given-names> </name><name name-style="western"><surname>Kwak</surname><given-names>H</given-names> </name><name name-style="western"><surname>An</surname><given-names>J</given-names> </name><name name-style="western"><surname>Sasahara</surname><given-names>K</given-names> </name></person-group><article-title>The impact of toxic trolling comments on anti-vaccine YouTube videos</article-title><source>Sci Rep</source><year>2024</year><month>03</month><day>1</day><volume>14</volume><issue>1</issue><fpage>5088</fpage><pub-id pub-id-type="doi">10.1038/s41598-024-54925-w</pub-id><pub-id pub-id-type="medline">38429466</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Data preprocessing and classification, detailed statistical analysis, and top 10 channels&#x2019; description.</p><media xlink:href="jmir_v28i1e88519_app1.docx" xlink:title="DOCX File, 715 KB"/></supplementary-material></app-group></back></article>