<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Form Res</journal-id><journal-id journal-id-type="publisher-id">formative</journal-id><journal-id journal-id-type="index">27</journal-id><journal-title>JMIR Formative Research</journal-title><abbrev-journal-title>JMIR Form Res</abbrev-journal-title><issn pub-type="epub">2561-326X</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v9i1e59687</article-id><article-id pub-id-type="doi">10.2196/59687</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>COVID-19 Public Health Communication on X (Formerly Twitter): Cross-Sectional Study of Message Type, Sentiment, and Source</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Parveen</surname><given-names>Sana</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Pereira</surname><given-names>Agustin Garcia</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Garzon-Orjuela</surname><given-names>Nathaly</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>McHugh</surname><given-names>Patricia</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Surendran</surname><given-names>Aswathi</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Vornhagen</surname><given-names>Heike</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Vellinga</surname><given-names>Akke</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib></contrib-group><aff id="aff1"><institution>School of Public Health, Physiotherapy and Sports Science, University College Dublin</institution><addr-line>Belfield, Dublin 4, Ireland</addr-line><addr-line>Dublin</addr-line><country>Ireland</country></aff><aff id="aff2"><institution>Data Science Institute, University of Galway</institution><addr-line>Galway</addr-line><country>Ireland</country></aff><aff id="aff3"><institution>J.E. Cairnes School of Business &#x0026; Economics, University of Galway</institution><addr-line>Galway</addr-line><country>Ireland</country><country>Ireland</country></aff><aff id="aff4"><institution>School of Medicine, Ollscoil na Gaillimhe &#x2013; University of Galway</institution><addr-line>Galway</addr-line><country>Ireland</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Mavragani</surname><given-names>Amaryllis</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Willis</surname><given-names>Erin</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Chandrasekaran</surname><given-names>Ranganathan</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Sana Parveen, PhD, School of Public Health, Physiotherapy and Sports Science, University College Dublin, Belfield, Dublin 4, Ireland, Dublin, D04 V1W8, Ireland, 353 017163445; <email>sana.parveen@ucd.ie</email></corresp></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>19</day><month>3</month><year>2025</year></pub-date><volume>9</volume><elocation-id>e59687</elocation-id><history><date date-type="received"><day>19</day><month>04</month><year>2024</year></date><date date-type="rev-recd"><day>18</day><month>12</month><year>2024</year></date><date date-type="accepted"><day>18</day><month>12</month><year>2024</year></date></history><copyright-statement>&#x00A9; Sana Parveen, Agustin Garcia Pereira, Nathaly Garzon-Orjuela, Patricia McHugh, Aswathi Surendran, Heike Vornhagen, Akke Vellinga. Originally published in JMIR Formative Research (<ext-link ext-link-type="uri" xlink:href="https://formative.jmir.org">https://formative.jmir.org</ext-link>), 19.3.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Formative Research, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://formative.jmir.org">https://formative.jmir.org</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://formative.jmir.org/2025/1/e59687"/><abstract><sec><title>Background</title><p>Social media can be used to quickly disseminate focused public health messages, increasing message reach and interaction with the public. Social media can also be an indicator of people&#x2019;s emotions and concerns. Social media data text mining can be used for disease forecasting and understanding public awareness of health-related concerns. Limited studies explore the impact of type, sentiment and source of tweets on engagement. Thus, it is crucial to research how the general public reacts to various kinds of messages from different sources.</p></sec><sec><title>Objective</title><p>The objective of this paper was to determine the association between message type, user (source) and sentiment of tweets and public engagement during the COVID-19 pandemic.</p></sec><sec sec-type="methods"><title>Methods</title><p>For this study, 867,485 tweets were extracted from January 1, 2020 to March 31, 2022 from Ireland and the United Kingdom. A 4-step analytical process was undertaken, encompassing sentiment analysis, bio-classification (user), message classification and statistical analysis. A combination of manual content analysis with abductive coding and machine learning models were used to categorize sentiment, user category and message type for every tweet. A zero-inflated negative binomial model was applied to explore the most engaging content mix.</p></sec><sec sec-type="results"><title>Results</title><p>Our analysis resulted in 12 user categories, 6 message categories, and 3 sentiment classes. Personal stories and positive messages have the most engagement, even though not for every user group; known persons and influencers have the most engagement with humorous tweets. Health professionals receive more engagement with advocacy, personal stories/statements and humor-based tweets. Health institutes observe higher engagement with advocacy, personal stories/statements, and tweets with a positive sentiment. Personal stories/statements are not the most often tweeted category (22%) but have the highest engagement (27%). Messages centered on shock/disgust/fear-based (32%) have a 21% engagement. The frequency of informative/educational communications is high (33%) and their engagement is 16%. Advocacy message (8%) receive 9% engagement. Humor and opportunistic messages have engagements of 4% and 0.5% and low frequenciesof 5% and 1%, respectively. This study suggests the optimum mix of message type and sentiment that each user category should use to get more engagement.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>This study provides comprehensive insight into Twitter (rebranded as X in 2023) users&#x2019; responses toward various message type and sources. Our study shows that audience engages with personal stories and positive messages the most. Our findings provide valuable guidance for social media-based public health campaigns in developing messages for maximum engagement.</p></sec></abstract><kwd-group><kwd>public health communication</kwd><kwd>surveillance</kwd><kwd>COVID-19</kwd><kwd>SARS-CoV-2</kwd><kwd>coronavirus</kwd><kwd>respiratory</kwd><kwd>infectious</kwd><kwd>pulmonary</kwd><kwd>pandemic</kwd><kwd>public health messaging</kwd><kwd>healthcare information</kwd><kwd>social media</kwd><kwd>tweets</kwd><kwd>text mining</kwd><kwd>data mining</kwd><kwd>social marketing</kwd><kwd>infoveillance</kwd><kwd>intervention planning</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Public health communication is the scientific research, strategic transmission, and critical evaluation of health information to promote public health [<xref ref-type="bibr" rid="ref1">1</xref>]. Public health communication initiatives can result in change by increasing awareness, boosting knowledge and forming attitudes when initiatives are well-planned, meticulously carried out, and sustained over time [<xref ref-type="bibr" rid="ref2">2</xref>].</p><p>Social media can be used to quickly disseminate focused public health messages, increasing message reach and interaction with the general public [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref4">4</xref>]. Identifying and understanding information needs, false information, hate speech and discrimination, adherence to precautions, and where concerns lay, aids in the customization of public health strategy and eventually, the development of more informed interventions [<xref ref-type="bibr" rid="ref5">5</xref>].</p><p>Social media can be a valuable resource for learning about people&#x2019;s emotions, concerns and exchanging information. This was shown for instance, when Ebola broke out in Nigeria and public health institutions assisted in containing the Ebola outbreak by tracking social media interactions and disseminating accurate information about the illness [<xref ref-type="bibr" rid="ref6">6</xref>]. Social media allows public health institutions to track outbreaks in real time and Twitter (rebranded as X in 2023) has been frequently used as a communication tool [<xref ref-type="bibr" rid="ref7">7</xref>]. The features and status of disease outbreaks can be predicted and explained using information from social media sites and user-generated information has supported the development of early response methods [<xref ref-type="bibr" rid="ref8">8</xref>].</p><p>Social media data text mining can be used for disease forecasting and understanding public awareness of health-related concerns [<xref ref-type="bibr" rid="ref8">8</xref>]. However, it is still unclear how different social media messages are shared and interpreted or whether different sources (individuals or institutions) communicate efficiently.</p><p>During the COVID-19 pandemic [<xref ref-type="bibr" rid="ref9">9</xref>], social media successfully informed and increased public awareness about this new phenomenon [<xref ref-type="bibr" rid="ref10">10</xref>]. However, there were considerable differences in the preferred social media platforms, message formats and source sender types [<xref ref-type="bibr" rid="ref11">11</xref>].</p><p>An important concern during the COVID-19 pandemic was the spread of misinformation on social media [<xref ref-type="bibr" rid="ref12">12</xref>]. Research shows that promoting more messages from reputable, authoritative sources on social media is one of the best ways to prevent misinformation [<xref ref-type="bibr" rid="ref13">13</xref>].</p><p>Examining the content of social media messages provides valuable and timely insights regarding public awareness levels and their needs [<xref ref-type="bibr" rid="ref14">14</xref>]. While there have been many studies analyzing the tweets on various health issues, there has been limited studies to explore the impact of type, sentiment and source of posts on engagement in public health communication. This study used tweets sent during the pandemic to explore 3 research questions:</p><list list-type="bullet"><list-item><p>Which sources of information are effective in public health communication?</p></list-item><list-item><p>What are the most effective types of messages in public health communication?</p></list-item><list-item><p>Which message type should different sources use to improve engagement?</p></list-item></list></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Data Collection</title><p>Data were extracted from Twitter using a Python script to communicate with Twitter Rest API (application programming interface) using the &#x201C;Search&#x201D; endpoint. The &#x201C;query&#x201D; parameter was used to filter the results based on the &#x201C;has:geo&#x201D; tag, the &#x201C;place_country:UK&#x201D;/ &#x201C;place_country:IE&#x201D; tag (for Ireland and the United Kingdom), and &#x201C;lang:en&#x201D; tag (for English). The &#x201D;start_time&#x201D; and &#x201C;end_time&#x201D; parameters were used to filter the posts from January 1, 2020 to March 31, 2022.</p><p>A basic search was conducted with phrases such as &#x201C;coronavirus,&#x201D; &#x201C;SARS-CoV-2,&#x201D; and &#x201C;COVID-19&#x201D; on Twitter. Using an iterative method, keywords were added and removed in order to find the most suitable for the data search. The final list of 10 keywords for data extraction included &#x201C;COVID-19,&#x201D; &#x201C;pandemic,&#x201D; &#x201C;SARS-CoV-2,&#x201D; &#x201C;coronavirus,&#x201D; &#x201C;SARS-CoV-2 virus,&#x201D; &#x201C;social distancing,&#x201D; &#x201C;self-isolation,&#x201D; &#x201C;self-quarantine,&#x201D; &#x201C;quarantine,&#x201D; and &#x201C;new variant.&#x201D; The total number of tweets extracted totaled 867,485.</p></sec><sec id="s2-2"><title>Data Analysis</title><p>Due to the extensive volume of data, a systematic approach was adopted using a 4-step analytical process including sentiment analysis, user-classification, message classification and statistical analysis (<xref ref-type="table" rid="table1">Table 1</xref>). A combination of manual coding and machine learning (ML) models were used for sentiment, user and message classification. This allowed for multiple rounds of coding to increase the robustness of our results. This methodology is also used by Kummervold et al in their study which shows that by utilizing machine learning models, they could almost exactly match the accuracy of a single human coder when it came to tweet classification. Their research indicates that this automated method, which is dependable and accurate, may be able to guide potentially useful and essential interventions while also freeing up important time and resources for carrying out similar analyses [<xref ref-type="bibr" rid="ref15">15</xref>].</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Phase wise description of the data analysis process.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="top">Phase</td><td align="left" valign="top">Tasks</td><td align="left" valign="top">Methods</td><td align="left" valign="top">Outcome</td></tr></thead><tbody><tr><td align="left" valign="top" rowspan="2">Data collection</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Identification of keywords related to COVID-19</p></list-item></list></td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Identification of 15 keywords.</p></list-item><list-item><p>After discussion among research team, reduced to 10 keywords for data extraction.</p></list-item></list></td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Final keywords</p></list-item></list></td></tr><tr><td align="left" valign="top"><list list-type="bullet"><list-item><p>Data extraction</p></list-item></list></td><td align="left" valign="top"><list list-type="bullet"><list-item><p>An academic researcher access was applied for with Twitter.</p></list-item><list-item><p>867,485 tweets extracted.</p></list-item></list></td><td align="left" valign="top"/></tr><tr><td align="left" valign="top">Sentiment analysis</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Allocate sentiment to each tweet</p></list-item></list></td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Random selection of 260 tweets for sentiment allocation (positive, negative, and neutral).</p></list-item><list-item><p>A total of 3 coders manually assigned sentiments to 1 set of 260 random tweets.</p></list-item><list-item><p>Using majority voting, out of 260 tweets, coders agreed on 247 tweets (2 or 3 coders voted the same).</p></list-item><list-item><p>Kappa statistic calculated between all coders and the models.</p></list-item><list-item><p>RoBERTa-base model (highest agreement) applied to the whole dataset.</p></list-item></list></td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Manual coded tweets</p></list-item><list-item><p>Kappa statistic results</p></list-item><list-item><p>Tweets sentiment assigned&#x2014;full dataset</p></list-item></list></td></tr><tr><td align="left" valign="top" rowspan="2">User classification</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Identify user categories</p></list-item></list></td><td align="left" valign="top"><list list-type="bullet"><list-item><p>User categories identified based on literature on social media supported public health interventions.</p></list-item><list-item><p>Definition of 5 user categories: health institute, health professional, influencer, researcher, and public.</p></list-item></list></td><td align="left" valign="top"><list list-type="bullet"><list-item><p>User categories</p></list-item></list></td></tr><tr><td align="left" valign="top"><list list-type="bullet"><list-item><p>Coding user profiles</p></list-item></list></td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Abductive coding by 4 Manual coders on 1000 randomly selected tweets to identify new user categories.</p></list-item><list-item><p>After 3 rounds of manual coding, most discrepancies or disagreements resolved through discussion.</p></list-item><list-item><p>Using majority voting, out of 250 tweets, coders agreed on 165 tweets (at least 3 coders voted the same).</p></list-item><list-item><p>A total of 3 ML models selected to assign user categories to same set of 250 tweets used in Round 3 of manual coding.</p></list-item><list-item><p>Bag of words were defined for each user category for user categorization by the ML models.</p></list-item><list-item><p>Accuracy score and <italic>F</italic><sub>1</sub>-score calculated between ML models and manual coders.</p></list-item><list-item><p>SetFit model (highest agreement) applied to the whole dataset.</p></list-item></list></td><td align="left" valign="top"><list list-type="bullet"><list-item><p>User classification coding&#x2014;Round 1, 2, and 3</p></list-item><list-item><p>Bag of words</p></list-item><list-item><p>Accuracy and <italic>F</italic><sub>1</sub>-score</p></list-item><list-item><p>Tweets users assigned&#x2014;full dataset</p></list-item></list></td></tr><tr><td align="left" valign="top" rowspan="2">Message classification</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Identify message categories</p></list-item></list></td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Message categories defined based on review of public health communication literature.</p></list-item><list-item><p>Definition of 5 message categories: humor, shock/disgust, informative/educational, opportunistic, and personal stories.</p></list-item></list></td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Message categories</p></list-item></list></td></tr><tr><td align="left" valign="top"><list list-type="bullet"><list-item><p>Coding tweets</p></list-item></list></td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Abductive coding by 5 manual coders on randomly selected tweets in 3 rounds: 100 tweets in round 1, 100 tweets in round 2, and 250 tweets in round 3.</p></list-item><list-item><p>After 2 rounds of manual coding, discrepancies or disagreements resolved through discussion.</p></list-item><list-item><p>A total of 6 final message categories after addition and reduction of categories over 3 rounds.</p></list-item><list-item><p>Using majority voting, out of 250 tweets, coders agreed on 203 tweets (3 or more coders voted the same).</p></list-item><list-item><p>GPT-3 and Setfit model to assign message categories to set of 250 tweets from the final round using 6 message categories.</p></list-item><list-item><p>Accuracy score and <italic>F</italic><sub>1</sub>-score calculated between models and manual coder.</p></list-item><list-item><p>SetFit model (highest agreement) applied to the whole dataset.</p></list-item></list></td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Manual coding&#x2014;Round 1, 2, and 3</p></list-item><list-item><p>Tweets message assigned&#x2014;Tweet users assigned</p></list-item></list></td></tr><tr><td align="left" valign="top">Statistical analysis</td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Engagement calculation</p></list-item></list></td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Exclusion of zero-follower users (n=537).</p></list-item><list-item><p>Calculation of engagement (sum of likes, replies, retweets and quoted tweet count divided by the respective user&#x2019;s followers)</p></list-item></list></td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"/><td align="left" valign="top"><list list-type="bullet"><list-item><p>Zero-inflation model</p></list-item></list></td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Exclusion of public user group (outside of objective of research) due to 87% zero-engagement.</p></list-item><list-item><p>Application of zero-inflated Poisson and zero-inflated negative binomial model due to remainder of 26% zero-engagement.</p></list-item><list-item><p>Selection of zero-inflated negative binomial model (best fit) with informative/educational message type and neutral sentiment as comparator.</p></list-item></list></td><td align="left" valign="top"><list list-type="bullet"><list-item><p>Final model results</p></list-item></list></td></tr></tbody></table></table-wrap><p>Our cross-sectional observational study aims to provide guidance for social media-based public health campaigns in developing messages for maximum engagement. The study adhered to the Strengthening the Reporting of Observational Studies in Epidemiology (STROBE) checklist for cross-sectional studies (<xref ref-type="supplementary-material" rid="app5">Checklist 1</xref>). Public health interventions are mostly run by governmental agencies or health institutes but can also involve collaborations with researchers, influencers, artists, etc. Therefore, it is important to study how the public engages with different types of messages from various sources. To ensure a clear distinction and understanding of public engagement, tweets by the general public were removed from our final analysis to focus on engagement received by tweets from all other sources.</p><sec id="s2-2-1"><title>Sentiment Analysis</title><p>A subset of 260 tweets was randomly extracted for manual annotation by three coders with sentiment labels - positive, negative or neutral (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Subsequently, we used 3 ML sentiment analysis models to detect the sentiment for the same tweet subset, which were: distilbert-base-uncased-finetuned-sst-2-english [<xref ref-type="bibr" rid="ref16">16</xref>], finite automata/bertweet-base-sentiment-analysis [<xref ref-type="bibr" rid="ref17">17</xref>], and RoBERTa-base for Sentiment Analysis [<xref ref-type="bibr" rid="ref18">18</xref>].</p><p>The kappa statistic was calculated between the 3 coders and between each coder and model. The model with the highest agreement with manual coders based on accuracy score [<xref ref-type="bibr" rid="ref19">19</xref>] and <italic>F</italic><sub>1</sub>-score [<xref ref-type="bibr" rid="ref20">20</xref>] was applied to the full dataset.</p></sec><sec id="s2-2-2"><title>User Classification</title><p>A directed content analysis with abductive coding was used to explore which sources of information are effective in public health communication. User categorization was based on the profile description and categorized according to an adaptation of the user categories from Cole-Lewis [<xref ref-type="bibr" rid="ref21">21</xref>]: health institute, health professional, influencer, researcher and public.</p><p>User coding was performed in 3 cycles. The profile description of 1000 randomly selected tweets were classified by 4 coders with an overlap of 10% for double coding, that is, coders independently assigned codes to the same set of tweets. The 1000 profile descriptions were categorized into 6 distinct categories with a directed content analysis approach [<xref ref-type="bibr" rid="ref22">22</xref>] with an additional category &#x201C;others.&#x201D; This &#x201C;others&#x201D; category was further defined through exploring the profile descriptions, resulting in a total of 12 categories.</p><p>The second round aimed to ensure consistency and accuracy between the coders. In total, 100 randomly selected profile descriptions of tweets were allocated to 12 user categories by each coder (<xref ref-type="table" rid="table2">Table 2</xref>) and agreements, disagreements and potential additions to the categories were discussed. A &#x201C;bag of words&#x201D; was compiled for each user category, providing descriptive insights into the characteristics of the users (<xref ref-type="table" rid="table2">Table 2</xref> and <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>).</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>User category and bag of words used for classification.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Index</td><td align="left" valign="bottom">User category</td><td align="left" valign="bottom">Profile keywords&#x2013;&#x201C;bag of words&#x201D; (Version 6)</td></tr></thead><tbody><tr><td align="left" valign="top">1</td><td align="left" valign="top">Health institute</td><td align="left" valign="top">ICGP<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup>; WHO<sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup>; NHS<sup><xref ref-type="table-fn" rid="table2fn3">c</xref></sup>; public health; ECDC<sup><xref ref-type="table-fn" rid="table2fn4">d</xref></sup>; HSE<sup><xref ref-type="table-fn" rid="table2fn5">e</xref></sup>; HPSC<sup><xref ref-type="table-fn" rid="table2fn6">f</xref></sup>; clinic; hospital</td></tr><tr><td align="left" valign="top">2</td><td align="left" valign="top">Health professional</td><td align="left" valign="top">health worker; GP<sup><xref ref-type="table-fn" rid="table2fn7">g</xref></sup>; consultant; nurse; MD<sup><xref ref-type="table-fn" rid="table2fn8">h</xref></sup>; specialist; physician; clinician; surgeon</td></tr><tr><td align="left" valign="top">3</td><td align="left" valign="top">University/Researcher</td><td align="left" valign="top">university; researcher; PhD; student; scientist; academic professor; academia; principal lecturer</td></tr><tr><td align="left" valign="top">4</td><td align="left" valign="top">Influencer</td><td align="left" valign="top">influencer; blogger; vlogger; coach; YouTube</td></tr><tr><td align="left" valign="top">5</td><td align="left" valign="top">Teacher</td><td align="left" valign="top">teacher; teach; school; education; children</td></tr><tr><td align="left" valign="top">6</td><td align="left" valign="top">Politician</td><td align="left" valign="top">politics; government; governor; cabinet; council; minister; councilor; ambassador; MP;<sup><xref ref-type="table-fn" rid="table2fn9">i</xref></sup> Secretary of state; Fine Gael; TD<sup><xref ref-type="table-fn" rid="table2fn10">j</xref></sup>; Mayor</td></tr><tr><td align="left" valign="top">7</td><td align="left" valign="top">Sports</td><td align="left" valign="top">football; rugby; run; swim; tennis; exercise; sports club; pickleball</td></tr><tr><td align="left" valign="top">8</td><td align="left" valign="top">Journalist</td><td align="left" valign="top">journalist; report; news; reporter; columnist; reviewer; media; correspondent; editor</td></tr><tr><td align="left" valign="top">9</td><td align="left" valign="top">Charity</td><td align="left" valign="top">charity; church; ngo; foundation; donations</td></tr><tr><td align="left" valign="top">10</td><td align="left" valign="top">Public</td><td align="left" valign="top">community; union; group; nature; lover; adventure; travel; live; life; world; freedom; farm; pet; cat; dog; walks</td></tr><tr><td align="left" valign="top">11</td><td align="left" valign="top">Known personality</td><td align="left" valign="top">views my own, &#x201C;True&#x201D; in verified status</td></tr><tr><td align="left" valign="top">12</td><td align="left" valign="top">Artist</td><td align="left" valign="top">artist; actor; actress; music; writer; singer; photography; movie; sing; play; cinema, orchestra</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>ICGP: Irish College of General Practitioners.</p></fn><fn id="table2fn2"><p><sup>b</sup>WHO: World Health Organization.</p></fn><fn id="table2fn3"><p><sup>c</sup>NHS: National Health Service.</p></fn><fn id="table2fn4"><p><sup>d</sup>ECDC: European Centre for Disease Prevention and Control.</p></fn><fn id="table2fn5"><p><sup>e</sup>HSE: Health Service Executive</p></fn><fn id="table2fn6"><p><sup>f</sup>HPSC: Health Protection Surveillance Centre.</p></fn><fn id="table2fn7"><p><sup>g</sup>GP: General Practitioner.</p></fn><fn id="table2fn8"><p><sup>h</sup>MD: Doctor of Medicine.</p></fn><fn id="table2fn9"><p><sup>i</sup>MP: Member of Parliament.</p></fn><fn id="table2fn10"><p><sup>j</sup>TD: Teachta D&#x00E1;la.</p></fn></table-wrap-foot></table-wrap><p>In the third round, 250 randomly selected profile descriptions were coded by 4 coders and compared with 3 different ML models using the same bag of words: Lbl2TransformerVec model (unsupervised) [<xref ref-type="bibr" rid="ref23">23</xref>], SGRank model [<xref ref-type="bibr" rid="ref24">24</xref>], and SetFit model [<xref ref-type="bibr" rid="ref23">23</xref>].</p><p>The ML models classified many influencers as &#x201C;Public,&#x201D; which was rectified by allocating influencer to any user with more than 3000 followers. The 3 models&#x2019; performance was evaluated using the profile descriptions of 250 tweets (third round of coding) from 4 coders. Majority voting was used to generate a final coding for the 250 profile descriptions and filtering out profiles that had less than 3 coders agreement. A final dataset of 165 profile descriptions was left after this filtering. The 3 models performance was compared with the manual allocation and the final classification was based on the majority allocation.</p></sec><sec id="s2-2-3"><title>Message Classification</title><p>Similar to the user classification, a directed content analysis with abductive coding was applied. A review of literature resulted in the identification of 5 message categories from a study by Gough et al [<xref ref-type="bibr" rid="ref25">25</xref>], which are humor, shock/disgust, educational/informative, personal stories, and opportunistic. The dataset was divided into 2 subsets&#x2014;public tweets and nonpublic tweets&#x2014;to determine which type of messages the public engages with most.</p><p>A total of 3 manual coding cycles were applied, starting the allocation of 100 random nonpublic tweets to the five message categories and an &#x201C;other&#x201D; category. In addition, 2 additional categories emerged, namely, fear and advocacy.</p><p>In Round 2, a total of 5 coders allocated 100 tweets to 7 message categories and discussed agreements and disagreements leading to a refinement of the message categories. Fear-based messaging was combined with shock/disgust, personal stories were combined with personal statements and a &#x201C;not enough information&#x201D; category was added. In the final round, 250 tweets were categorised into 7 message categories, which are humor, shock/disgust/fear-based, educational/informative, personal stories/statements, opportunistic, advocacy, and not enough info, and compared to 2 ML models (GPT-3 [OpenAI] and SetFit; <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>).</p></sec><sec id="s2-2-4"><title>Statistical Analysis</title><p>For each tweet, engagement was calculated as the sum of likes, replies, retweets, and quoted tweet count divided by the respective user&#x2019;s follower count [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref27">27</xref>].</p><p>For 87% of the tweets, the engagement was zero due to the lack of followers or likes, replies, or quotes (mainly public users). The final dataset excluded this user category resulting in the reduction to 26% zeros. Zero-inflated Poisson and zero-inflated negative binomial models were applied.</p></sec></sec><sec id="s2-3"><title>Ethical Considerations</title><p>Only publicly available data were extracted for this study. All personal identifiable information was deidentified during the data cleaning process.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><p>The total number of tweets extracted was 867,485, which reduced to 802,042 after deleting duplicates. Majority of the tweets (729,619) came from the United Kingdom, 72,350 from Ireland, and 73 were without a location.</p><p>The follower count for the dataset showed a wide range, from a maximum of 14,065,098 followers to 0 followers, with an average of 4296 followers. Accounts (users) without followers were investigated to identify inactive accounts or bots and 537 users were removed from the dataset.</p><p>Public user category tweets (430,760) were removed from the final dataset as they were not a user category of interest. The final dataset included 370,745 tweets.</p><sec id="s3-1"><title>Sentiment Analysis</title><p>Out of 260 tweets, coders agreed on 247 tweets (this is when 2-3 coders voted the same), which were compared with the accuracy score and <italic>F</italic><sub>1</sub>-score (weighted) of the 3 ML models. The RoBERTa-base (Model 3) performed the best and was used to assign sentiment to all tweets (<xref ref-type="table" rid="table3">Table 3</xref>).</p><p>Sentiment was negative for 138,379 tweets (37.3%), positive for 84,939 (22.9%), and neutral for 147,427 tweets (39.8%). Positive sentiment tweets had the highest engagement (29.3%), followed by negative (26.7%) and neutral (20.4%; <xref ref-type="table" rid="table4">Table 4</xref>).</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Accuracy and <italic>F</italic><sub>1</sub>-score for sentiment models with machine learning models.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Model</td><td align="left" valign="bottom">Accuracy</td><td align="left" valign="bottom"><italic>F</italic><sub>1</sub>-score (weighted)</td></tr></thead><tbody><tr><td align="left" valign="top">1&#x2013;Distilbert-base-uncased-finetuned-sst-2-english</td><td align="left" valign="top">0.68</td><td align="left" valign="top">0.61</td></tr><tr><td align="left" valign="top">2&#x2013;Finite automata/bertweet-base-sentiment-analysis</td><td align="left" valign="top">0.58</td><td align="left" valign="top">0.61</td></tr><tr><td align="left" valign="top">3&#x2013;RoBERTa-base</td><td align="left" valign="top">0.74</td><td align="left" valign="top">0.76</td></tr></tbody></table></table-wrap><table-wrap id="t4" position="float"><label>Table 4.</label><caption><p>Frequency and engagement for each sentiment category.</p></caption><table id="table4" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Sentiment</td><td align="left" valign="bottom">Engagement, %</td><td align="left" valign="bottom">Frequency, %</td></tr></thead><tbody><tr><td align="left" valign="top">Positive</td><td align="char" char="." valign="top">29.3</td><td align="char" char="." valign="top">22.9</td></tr><tr><td align="left" valign="top">Negative</td><td align="char" char="." valign="top">26.7</td><td align="char" char="." valign="top">37.3</td></tr><tr><td align="left" valign="top">Neutral</td><td align="char" char="." valign="top">20.4</td><td align="char" char="." valign="top">39.8</td></tr></tbody></table></table-wrap></sec><sec id="s3-2"><title>User Classification</title><p>Model 3 (assisted) achieved an accuracy score of 0.73 when 4 to 5 coders were in agreement, and achieved an accuracy score of 0.77 when there was at least one match with one coder&#x2014;192/250 tweets (<xref ref-type="table" rid="table5">Table 5</xref>).</p><p>Health professionals (8%) significantly outnumbered health institutes (1%), while the number of influencers (32%) was more than twice that of journalists (15%) and politicians (13%). Artists (6%) outnumbered individuals associated with sports (2%), and teachers (3%) were one-third in comparison to university/researchers (14%), see <xref ref-type="table" rid="table6">Table 6</xref>.</p><p><xref ref-type="table" rid="table7">Table 7</xref> shows the frequency and percentage of engagement for each user category and provides valuable insights into their impact and effectiveness in engaging audiences. Health professionals have the highest level of engagement (15%), followed by university/researchers (13%) despite a lower frequency (8%). Even though influencers have high frequency (32%) it does not translate into high engagement with influencers having a lower percentage of engagement at 12%.</p><p>Journalists and politicians account for 15% and 13%, respectively, with 8% engagement each. Teachers, known personalities. and charities received engagement of 6%, 4%, and 3%, respectively, at lower frequencies. Sports and health Institutes have the lowest engagement each at 1%.</p><table-wrap id="t5" position="float"><label>Table 5.</label><caption><p>Accuracy and <italic>F</italic><sub>1</sub>-score for user classification with machine learning models.</p></caption><table id="table5" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Model</td><td align="left" valign="bottom">Accuracy</td><td align="left" valign="bottom"><italic>F</italic><sub>1</sub>-score (weighted)</td></tr></thead><tbody><tr><td align="left" valign="top">1-Lbl2TransformerVec</td><td align="left" valign="top">0.26</td><td align="left" valign="top">0.21</td></tr><tr><td align="left" valign="top">2-SGRank</td><td align="left" valign="top">0.43</td><td align="left" valign="top">0.43</td></tr><tr><td align="left" valign="top">3-SetFit</td><td align="left" valign="top">0.69</td><td align="left" valign="top">0.67</td></tr><tr><td align="left" valign="top">3-SetFit (assisted)</td><td align="left" valign="top">0.73</td><td align="left" valign="top">0.73</td></tr></tbody></table></table-wrap><table-wrap id="t6" position="float"><label>Table 6.</label><caption><p>User categories and their frequency.</p></caption><table id="table6" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">User categories</td><td align="left" valign="bottom">Frequency, n</td><td align="left" valign="bottom">Frequency, %</td></tr></thead><tbody><tr><td align="left" valign="top">Influencer</td><td align="left" valign="top">119,711</td><td align="left" valign="top">32.3</td></tr><tr><td align="left" valign="top">Journalist</td><td align="left" valign="top">54,384</td><td align="left" valign="top">14.7</td></tr><tr><td align="left" valign="top">University/Researcher</td><td align="left" valign="top">50,275</td><td align="left" valign="top">13.6</td></tr><tr><td align="left" valign="top">Politician</td><td align="left" valign="top">47,694</td><td align="left" valign="top">12.9</td></tr><tr><td align="left" valign="top">Health professional</td><td align="left" valign="top">28,963</td><td align="left" valign="top">7.8</td></tr><tr><td align="left" valign="top">Artist</td><td align="left" valign="top">21,730</td><td align="left" valign="top">5.9</td></tr><tr><td align="left" valign="top">Known personality</td><td align="left" valign="top">15,095</td><td align="left" valign="top">4.1</td></tr><tr><td align="left" valign="top">Teacher</td><td align="left" valign="top">12,019</td><td align="left" valign="top">3.2</td></tr><tr><td align="left" valign="top">Charity</td><td align="left" valign="top">11,788</td><td align="left" valign="top">3.2</td></tr><tr><td align="left" valign="top">Sports</td><td align="left" valign="top">5659</td><td align="left" valign="top">1.5</td></tr><tr><td align="left" valign="top">Health institute</td><td align="left" valign="top">3427</td><td align="left" valign="top">0.9</td></tr></tbody></table></table-wrap><table-wrap id="t7" position="float"><label>Table 7.</label><caption><p>Frequency and engagement for each user category excluding public.</p></caption><table id="table7" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">User category</td><td align="left" valign="bottom">Engagement, %</td><td align="left" valign="bottom">Frequency, %</td></tr></thead><tbody><tr><td align="left" valign="top">Health institute</td><td align="char" char="." valign="top">0.7</td><td align="char" char="." valign="top">0.9</td></tr><tr><td align="left" valign="top">Sports</td><td align="char" char="." valign="top">1.4</td><td align="char" char="." valign="top">1.5</td></tr><tr><td align="left" valign="top">Charity</td><td align="char" char="." valign="top">3.2</td><td align="char" char="." valign="top">3.2</td></tr><tr><td align="left" valign="top">Teacher</td><td align="char" char="." valign="top">5.5</td><td align="char" char="." valign="top">3.2</td></tr><tr><td align="left" valign="top">Known personality</td><td align="char" char="." valign="top">4.1</td><td align="char" char="." valign="top">4.1</td></tr><tr><td align="left" valign="top">Artist</td><td align="char" char="." valign="top">6.1</td><td align="char" char="." valign="top">5.9</td></tr><tr><td align="left" valign="top">Health professional</td><td align="char" char="." valign="top">15.2</td><td align="char" char="." valign="top">7.8</td></tr><tr><td align="left" valign="top">Politician</td><td align="char" char="." valign="top">7.8</td><td align="char" char="." valign="top">12.9</td></tr><tr><td align="left" valign="top">University/Researcher</td><td align="char" char="." valign="top">12.7</td><td align="char" char="." valign="top">13.6</td></tr><tr><td align="left" valign="top">Journalist</td><td align="char" char="." valign="top">8.2</td><td align="char" char="." valign="top">14.7</td></tr><tr><td align="left" valign="top">Influencer</td><td align="char" char="." valign="top">11.5</td><td align="char" char="." valign="top">32.3</td></tr></tbody></table></table-wrap></sec><sec id="s3-3"><title>Message Classification</title><p>The 2 models&#x2019; performance was evaluated using 250 tweets from 5 coders. Majority voting was used to generate a final coding for the 250 tweets, and filtering out tweets that had less than 3 coders agreement. In addition, 11 tweets were removed because they were identified by the coders as &#x201C;Not enough information&#x201D; to code. A final dataset of 203 tweets was left after this filtering. SetFit outperformed GPT-3 and this model achieved 80% accuracy when considering a match with at least 1 coder (192/239 tweets; <xref ref-type="table" rid="table8">Table 8</xref>).</p><p>Personal stories/statements have the highest engagement at 27%, but are not the most frequent tweeted category (22%; <xref ref-type="table" rid="table9">Table 9</xref>). Shock/disgust/fear-based messages (32%) have 21% engagement. Informative/educational messages have high frequencies (33%) and have 16% engagement. Advocacy messages (8%) have 9% engagement and humor and opportunistic messages have engagements of 4% and 0.5%, and low frequencies 5% and 1%, respectively (<xref ref-type="table" rid="table10">Table 10</xref>).</p><table-wrap id="t8" position="float"><label>Table 8.</label><caption><p>Accuracy and <italic>F</italic><sub>1</sub>-score for user classification with machine learning (ML) models.</p></caption><table id="table8" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom"/><td align="left" valign="bottom" colspan="2">4 and 5 coders agreement</td><td align="left" valign="bottom" colspan="2">3, 4, or 5 coders agreement</td></tr><tr><td align="left" valign="top"/><td align="left" valign="top">Accuracy</td><td align="left" valign="top"><italic>F</italic><sub>1</sub>-score (weighted)</td><td align="left" valign="top">Accuracy</td><td align="left" valign="top"><italic>F</italic><sub>1</sub>-score (weighted)</td></tr></thead><tbody><tr><td align="left" valign="top">GPT-3</td><td align="left" valign="top">0.60</td><td align="left" valign="top">0.60</td><td align="left" valign="top">0.51</td><td align="left" valign="top">0.49</td></tr><tr><td align="left" valign="top">SetFit</td><td align="left" valign="top">0.74</td><td align="left" valign="top">0.74</td><td align="left" valign="top">0.64</td><td align="left" valign="top">0.62</td></tr></tbody></table></table-wrap><table-wrap id="t9" position="float"><label>Table 9.</label><caption><p>Frequency and engagement for each message type.</p></caption><table id="table9" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Message type</td><td align="left" valign="bottom">Engagement, %</td><td align="left" valign="bottom">Frequency, %</td></tr></thead><tbody><tr><td align="left" valign="top">Opportunistic</td><td align="char" char="." valign="top">0.5</td><td align="char" char="." valign="top">0.7</td></tr><tr><td align="left" valign="top">Humor</td><td align="char" char="." valign="top">3.7</td><td align="char" char="." valign="top">4.7</td></tr><tr><td align="left" valign="top">Advocacy</td><td align="char" char="." valign="top">9.1</td><td align="char" char="." valign="top">8.5</td></tr><tr><td align="left" valign="top">Personal stories/statements</td><td align="char" char="." valign="top">26.7</td><td align="char" char="." valign="top">21.8</td></tr><tr><td align="left" valign="top">Shock/disgust/fear-based</td><td align="char" char="." valign="top">21</td><td align="char" char="." valign="top">31.9</td></tr><tr><td align="left" valign="top">Informative/educational</td><td align="char" char="." valign="top">15.5</td><td align="char" char="." valign="top">32.5</td></tr></tbody></table></table-wrap><table-wrap id="t10" position="float"><label>Table 10.</label><caption><p>Message types frequency and engagement percentage.</p></caption><table id="table10" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Message category</td><td align="left" valign="bottom">Example tweet</td><td align="left" valign="bottom">Frequency, n</td><td align="left" valign="bottom">Engagement, %</td></tr></thead><tbody><tr><td align="left" valign="top">Informative/ educational</td><td align="left" valign="top">Coronavirus Daily Update: As at 06 Mar 2022, in the Isle of Man there have been 23328 confirmed cases. #coronavirus #iom #coronaupdate</td><td align="left" valign="top">120,317</td><td align="left" valign="top">15.5</td></tr><tr><td align="left" valign="top">Shock/disgust/ fear-based</td><td align="left" valign="top">@Mysturji @AntacsB @Keir_Starmer General strike? We&#x2019;re already basically on one.<break/>Take to the streets? And die of a pandemic?</td><td align="left" valign="top">118,238</td><td align="left" valign="top">21</td></tr><tr><td align="left" valign="top">Personal stories/ statements</td><td align="left" valign="top">Celebrating my end of Self-isolation period with some improvised gluten free macaroni and, er, fussili and cheese. #norecipe #foodie #satisfied @ Dublin, Ireland</td><td align="left" valign="top">80,881</td><td align="left" valign="top">26.7</td></tr><tr><td align="left" valign="top">Advocacy</td><td align="left" valign="top">&#x201A;&#x00C4;&#x00F2;Each person who has died in this pandemic is a loved person, a life gone too soon and a family torn apart.'<break/>Hold a public inquiry into the Government&#x2019;s handling of the Covid-19 pandemic<break/>#Covid19 - Sign the Petition!</td><td align="left" valign="top">31,340</td><td align="left" valign="top">9.1</td></tr><tr><td align="left" valign="top">Humor</td><td align="left" valign="top">The government says we need to exercise social distancing, stay indoors as much as possible and behave like other people might be carrying a disease like this is all new, but I&#x201A;&#x00C4;&#x00F4;ve been doing it since about 2002 #introvert #hermit</td><td align="left" valign="top">17,302</td><td align="left" valign="top">3.7</td></tr><tr><td align="left" valign="top">Opportunistic</td><td align="left" valign="top">In light of #pandemic financial challenges for families, I considered the 10% property tax base increase on Waterford #households trying to recover from the pandemic morally wrong in 2020.<break/>Yesterday I voted against #LPT 10% increase &#x0026;amp; my party again!</td><td align="left" valign="top">2667</td><td align="left" valign="top">0.5</td></tr></tbody></table></table-wrap></sec><sec id="s3-4"><title>Statistical Analysis</title><p>A zero-inflated negative binomial model was applied with informative/educational tweets and neutral sentiment as reference categories. Health professionals received more engagement with advocacy, personal stories/statements and humor. Health Institutes observe higher engagement with advocacy, personal stories/statements and tweets with a positive sentiment (<xref ref-type="supplementary-material" rid="app4">Multimedia Appendix 4</xref>).</p><p>Journalists and teachers observe higher engagement with advocacy, personal stories/statements and humor while artists have more engagement with shock/disgust/fear-based messages and positive sentiment. Charity organizations, universities, and researchers have more engagement with advocacy and personal stories/statements but not with shock/disgust/fear tweets.</p><p>Known personalities have most engagement with advocacy and humor-based, which is opposite for sports entities. Sports entities have more engagement with personal stories/statements and positive sentiment. Politicians and influencers have more engagement with advocacy, personal stories/statements and humor, while they should avoid opportunistic tweets. <xref ref-type="table" rid="table11">Table 11</xref> shows the message type and sentiment each user category should tweet and avoid to get maximum engagement.</p><table-wrap id="t11" position="float"><label>Table 11.</label><caption><p>Findings of zero-inflated model.</p></caption><table id="table11" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">User category</td><td align="left" valign="bottom">Message type to post</td><td align="left" valign="bottom">Message type to avoid</td></tr></thead><tbody><tr><td align="left" valign="top">Health Institute</td><td align="left" valign="top">Advocacy, personal stories/statements, and positive sentiment</td><td align="left" valign="top">Opportunistic, shock/disgust/fear-based, and negative sentiment</td></tr><tr><td align="left" valign="top">Artist</td><td align="left" valign="top">Shock/disgust/fear-based and positive sentiment</td><td align="left" valign="top">Humor and opportunistic</td></tr><tr><td align="left" valign="top">Charity</td><td align="left" valign="top">Advocacy and personal stories/statements</td><td align="left" valign="top">Humor and negative sentiment</td></tr><tr><td align="left" valign="top">Journalist</td><td align="left" valign="top">Advocacy, personal stories/statements and humor</td><td align="left" valign="top">Shock/disgust/fear-based and negative sentiment</td></tr><tr><td align="left" valign="top">Known personality</td><td align="left" valign="top">Advocacy and humor</td><td align="left" valign="top">Shock/ disgust/fear-based</td></tr><tr><td align="left" valign="top">Teacher</td><td align="left" valign="top">Advocacy, personal stories/statements and humor</td><td align="left" valign="top">Shock/disgust/fear-based and negative sentiment</td></tr><tr><td align="left" valign="top">Health professional</td><td align="left" valign="top">Advocacy and personal stories/statements</td><td align="left" valign="top">Opportunistic and shock/disgust/fear-based</td></tr><tr><td align="left" valign="top">Influencer</td><td align="left" valign="top">Advocacy, personal stories/statements and Humor</td><td align="left" valign="top">Opportunistic and negative sentiment</td></tr><tr><td align="left" valign="top">Sports</td><td align="left" valign="top">Personal stories/statements and positive sentiment</td><td align="left" valign="top">Shock/disgust/fear-based</td></tr><tr><td align="left" valign="top">Politician</td><td align="left" valign="top">Advocacy, personal stories/statements, and humor</td><td align="left" valign="top">Opportunistic and negative sentiment</td></tr><tr><td align="left" valign="top">University/Researcher</td><td align="left" valign="top">Advocacy and personal stories/statements</td><td align="left" valign="top">Shock/disgust/fear-based and negative sentiment</td></tr></tbody></table></table-wrap></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>This analysis of type, sentiment, and source of COVID-19&#x2013;related tweets showed what type of tweets have the most engagement for each user group. Overall, personal stories and positive messages have most engagement, even though not for every user group; known persons and influencers have most engagement with humorous tweets. Journalists and teachers were found to have flexibility in their posting strategies, with advocacy, personal stories/statements, and humor being effective for them as well. Artists garnered the most engagement with shock/disgust/fear-based and positive sentiment posts, while charity organizations and universities/researchers had advocacy and personal stories/statements as more engaging message types. Known personalities and sports entities also displayed varying engagement for message types and sentiments, with the former having advocacy and humor-based posts more engaging, while the latter should focus on personal stories/statements and positive sentiment. Politicians and influencers, on the other hand, exhibited higher engagement with advocacy, personal stories/statements, and shock/disgust/fear-based messages, while avoiding opportunistic content.</p><p>Positive sentiments in public health messages typically evoke feelings of hope, encouragement, and trust among users, leading to increased sharing behavior [<xref ref-type="bibr" rid="ref28">28</xref>]. Users are more inclined to engage with and share positive messages that resonate with them emotionally, as they perceive such content as uplifting and supportive [<xref ref-type="bibr" rid="ref28">28</xref>]. This explains the high engagement received by positive sentiment tweets despite having lower frequency, as shown in <xref ref-type="table" rid="table4">Table 4</xref> in this study. Our initial manual categorization ensured a reliable baseline for sentiment analysis in this study. The frequency of negative sentiment tweets and their engagement reflects the widespread anxiety, fear, and uncertainty during the pandemic [<xref ref-type="bibr" rid="ref29">29</xref>]. The high engagement of tweets with negative sentiments further emphasizes the need to consider emotional content in information dissemination on social media platforms such as Twitter. In this context, future studies should explore the specific impact of tweets by analyzing the responses they generate, including retweets with quotes and replies. This approach would provide additional insights and allow us to evaluate whether tweets achieve their intended impact.</p><p>The findings of this study revealed distinct patterns of public engagement across different user categories and message types. Trusted sources are important in shaping public behavior and engagement with health information during crises [<xref ref-type="bibr" rid="ref30">30</xref>]. Overall, in the case of users, health professionals received high engagement during the pandemic whereas health institutes received the lowest engagement, maybe reflecting their different use of messages. This highlights the importance of using specific message types for each user category to achieve engagement, as recommended by our study. In addition, health experts, such as general practitioners, communicate health information with greater credibility and persuasiveness than nonexperts or institutes [<xref ref-type="bibr" rid="ref31">31</xref>].</p><p>Internet-based health communities and social media platforms influence public health behaviors and engagement levels [<xref ref-type="bibr" rid="ref32">32</xref>]. The definition and expansion of sources (user categories) in this study provides a framework to develop specific messaging by user group. Our findings reiterate the importance of understanding audience and tailoring engagement strategies based on category-specific behaviors for optimal engagement [<xref ref-type="bibr" rid="ref33">33</xref>-<xref ref-type="bibr" rid="ref35">35</xref>].</p></sec><sec id="s4-2"><title>Comparison With Previous Work</title><p>Most studies have focused on the content of the tweets to understand public reactions or sentiment [<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref37">37</xref>], trends during the COVID-19 pandemic [<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref39">39</xref>], or vaccinations [<xref ref-type="bibr" rid="ref40">40</xref>-<xref ref-type="bibr" rid="ref42">42</xref>].</p><p>In one study, Twitter data were explored using machine learning to examine how public opinions and discussions changed throughout the COVID-19 epidemic [<xref ref-type="bibr" rid="ref36">36</xref>]. Trends in social media discussions during the pandemic were explored using sentiment analysis and topic modeling, which produced useful information about the public discussion around the pandemic [<xref ref-type="bibr" rid="ref38">38</xref>]. These studies focused mainly on the content of tweets and their engagement but did not explore their association with sources, message type, or sentiments.</p><p>The classification of tweets based on types enriched the analysis by capturing the multifaceted nature of communication during the pandemic and provided an understanding of how different message categories influence public engagement and sharing behavior. This study also added to the existing literature by introducing 2 new message categories&#x2014;advocacy and personal statements&#x2014;while modifying the existing categories to enable application and provide guidance in framing future public health communications.</p><p>Public health literature on message types is very limited. A scoping review on the health risk communication with the public during a pandemic found a lack of studies on the modes of communication [<xref ref-type="bibr" rid="ref43">43</xref>]. One study discussed the framing of effective COVID-19 messages to connect individuals to authoritative content, emphasising the importance of positive and gain-framed messages [<xref ref-type="bibr" rid="ref44">44</xref>]. Similarly, personal experiences increased the salience of public health messaging, particularly in promoting sanitation and hygiene practices [<xref ref-type="bibr" rid="ref45">45</xref>]. Public health messaging during the lockdown in New Zealand showed the importance of consistent messaging principles such as transparency, timeliness, empathy, and clarity [<xref ref-type="bibr" rid="ref46">46</xref>]. None of these studies used defined message categories and the definition and recommendation of message types for different user categories is a major contribution of our study. This will help content creators, particularly health intervention planners, in choosing the right mix of message and sentiment type to increase their engagement.</p><p>A similar study of social media messages explored account type and message structure, taking elements such as hashtags, hyperlinks, mentions, and any images or videos into account but only counting retweets as engagement [<xref ref-type="bibr" rid="ref8">8</xref>]. They found that tweets with hashtags, videos, and pictures were retweeted more often, while tweets with links had fewer retweets. Furthermore, tweets with sentiment were more frequently retweeted than tweets with neutral sentiments. In our study, the user profile and engagement were explored through engagement metrics such as likes, retweets, reply count, and quote count. We found health institutes to be the least engaged user category, while Xie et al [<xref ref-type="bibr" rid="ref8">8</xref>] found national health authorities received more engagement when compared with provincial accounts. However, their analysis was limited to the study of the official (national and provincial) public health agencies&#x2019; Sina Weibo posts only (a China-only microblogging platform).</p><p>This study&#x2019;s novel approach lies in the examination of engagement for a 2-year period across different user categories for different message types and sentiment, providing insights into public&#x2019;s response toward different messages and sources. The volume of data and methodology used allows us to provide insights that were not addressed in the existing body of work. This differs from the current studies with similar research objectives, such as a comparative study between Poland and Jordan [<xref ref-type="bibr" rid="ref47">47</xref>] on social media&#x2019;s role focused on the disparities in platform choices and message efficacy. Another study categorized COVID-19-related tweets into themes to understand public sentiment. The study identified 5 themes for message categories, which were general information, health information, expressions, humor and others, but used a small dataset [<xref ref-type="bibr" rid="ref48">48</xref>]. Furthermore, a study examined Canadian public health tweets, revealing that tweets promoting action garnered more engagement than purely informational ones. However, retweets were used as the measure for engagement, unlike our study, where we took into consideration a more comprehensive method for calculating engagement [<xref ref-type="bibr" rid="ref49">49</xref>]. This is another strength of our study, where we compared engagement across message types and user categories instead of solely depending on likes for comparison.</p><p>Our findings suggest a correlation between message type, sentiment, source credibility, and engagement. Our study shows that audience engages with personal stories and positive messages the most. Also, with varied users, different types of messages yield engagement. Our study provides guidance for social media&#x2013;based public health campaigns for developing messages for maximum engagement.</p></sec><sec id="s4-3"><title>Limitations</title><p>We included just 3 factors (sentiment, user type, and message type) for the analysis, which was leading to variance in our analysis. Other factors not recorded or captured may also influence engagement, for instance, time or day of posts, hashtags, images, etc. For our study, we also excluded tweets from the public user category, which was almost 50% of the dataset as it was not required to address this study&#x2019;s research questions.</p></sec><sec id="s4-4"><title>Conclusion</title><p>Our study provides a framework to develop social media messages according to sentiment and message type for different users. Health professionals and institutes and other users can build on the results to improve effective communication through social media channels.</p></sec></sec></body><back><notes><sec><title>Data Availability</title><p>The datasets generated or analyzed during this study are available from the corresponding author on reasonable request</p></sec></notes><fn-group><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">API</term><def><p>application programming interface</p></def></def-item><def-item><term id="abb2">ML</term><def><p>machine learning</p></def></def-item><def-item><term id="abb3">STROBE</term><def><p>Strengthening the Reporting of Observational Studies in Epidemiology</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bernhardt</surname><given-names>JM</given-names> </name></person-group><article-title>Communication at the core of effective public health</article-title><source>Am J Public Health</source><year>2004</year><month>12</month><volume>94</volume><issue>12</issue><fpage>2051</fpage><lpage>2053</lpage><pub-id pub-id-type="doi">10.2105/ajph.94.12.2051</pub-id><pub-id pub-id-type="medline">15569948</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="book"><person-group person-group-type="editor"><name name-style="western"><surname>Hornik</surname><given-names>RC</given-names> </name></person-group><source>Public Health Communication: Evidence for Behavior Change</source><year>2002</year><publisher-name>Routledge</publisher-name><pub-id pub-id-type="doi">10.4324/9781410603029</pub-id><pub-id pub-id-type="other">9780805831771</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Plackett</surname><given-names>R</given-names> </name><name name-style="western"><surname>Kaushal</surname><given-names>A</given-names> </name><name name-style="western"><surname>Kassianos</surname><given-names>AP</given-names> </name><etal/></person-group><article-title>Use of social media to promote cancer screening and early diagnosis: scoping review</article-title><source>J Med Internet Res</source><year>2020</year><month>11</month><day>9</day><volume>22</volume><issue>11</issue><fpage>e21582</fpage><pub-id pub-id-type="doi">10.2196/21582</pub-id><pub-id pub-id-type="medline">33164907</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Khan</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Tracey</surname><given-names>S</given-names> </name><name name-style="western"><surname>O&#x2019;Sullivan</surname><given-names>T</given-names> </name><name name-style="western"><surname>Gournis</surname><given-names>E</given-names> </name><name name-style="western"><surname>Johnson</surname><given-names>I</given-names> </name></person-group><article-title>Retiring the flip phones: exploring social media use for managing public health incidents</article-title><source>Disaster Med Public Health Prep</source><year>2019</year><month>12</month><volume>13</volume><issue>5-6</issue><fpage>859</fpage><lpage>867</lpage><pub-id pub-id-type="doi">10.1017/dmp.2018.147</pub-id><pub-id pub-id-type="medline">31218988</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jang</surname><given-names>H</given-names> </name><name name-style="western"><surname>Rempel</surname><given-names>E</given-names> </name><name name-style="western"><surname>Roth</surname><given-names>D</given-names> </name><name name-style="western"><surname>Carenini</surname><given-names>G</given-names> </name><name name-style="western"><surname>Janjua</surname><given-names>NZ</given-names> </name></person-group><article-title>Tracking COVID-19 discourse on twitter in North America: infodemiology study using topic modeling and aspect-based sentiment analysis</article-title><source>J Med Internet Res</source><year>2021</year><month>02</month><day>10</day><volume>23</volume><issue>2</issue><fpage>e25431</fpage><pub-id pub-id-type="doi">10.2196/25431</pub-id><pub-id pub-id-type="medline">33497352</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Carter</surname><given-names>M</given-names> </name></person-group><article-title>How twitter may have helped Nigeria contain ebola</article-title><source>BMJ</source><year>2014</year><month>11</month><day>19</day><volume>349</volume><fpage>g6946</fpage><pub-id pub-id-type="doi">10.1136/bmj.g6946</pub-id><pub-id pub-id-type="medline">25410185</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bartlett</surname><given-names>C</given-names> </name><name name-style="western"><surname>Wurtz</surname><given-names>R</given-names> </name></person-group><article-title>Twitter and public health</article-title><source>J Public Health Manag Pract</source><year>2015</year><volume>21</volume><issue>4</issue><fpage>375</fpage><lpage>383</lpage><pub-id pub-id-type="doi">10.1097/PHH.0000000000000041</pub-id><pub-id pub-id-type="medline">24356087</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Xie</surname><given-names>J</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>L</given-names> </name></person-group><article-title>Identifying features of source and message that influence the retweeting of health information on social media during the COVID-19 pandemic</article-title><source>BMC Public Health</source><year>2022</year><month>12</month><volume>22</volume><issue>1</issue><fpage>805</fpage><pub-id pub-id-type="doi">10.1186/s12889-022-13213-w</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ciotti</surname><given-names>M</given-names> </name><name name-style="western"><surname>Ciccozzi</surname><given-names>M</given-names> </name><name name-style="western"><surname>Terrinoni</surname><given-names>A</given-names> </name><name name-style="western"><surname>Jiang</surname><given-names>WC</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>CB</given-names> </name><name name-style="western"><surname>Bernardini</surname><given-names>S</given-names> </name></person-group><article-title>The COVID-19 pandemic</article-title><source>Crit Rev Clin Lab Sci</source><year>2020</year><month>09</month><volume>57</volume><issue>6</issue><fpage>365</fpage><lpage>388</lpage><pub-id pub-id-type="doi">10.1080/10408363.2020.1783198</pub-id><pub-id pub-id-type="medline">32645276</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Al-Dmour</surname><given-names>H</given-names> </name><name name-style="western"><surname>Masa&#x2019;deh</surname><given-names>R</given-names> </name><name name-style="western"><surname>Salman</surname><given-names>A</given-names> </name><name name-style="western"><surname>Abuhashesh</surname><given-names>M</given-names> </name><name name-style="western"><surname>Al-Dmour</surname><given-names>R</given-names> </name></person-group><article-title>Influence of social media platforms on public health protection against the COVID-19 pandemic via the mediating effects of public health awareness and behavioral changes: integrated model</article-title><source>J Med Internet Res</source><year>2020</year><month>08</month><day>19</day><volume>22</volume><issue>8</issue><fpage>e19996</fpage><pub-id pub-id-type="doi">10.2196/19996</pub-id><pub-id pub-id-type="medline">32750004</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gan</surname><given-names>CCR</given-names> </name><name name-style="western"><surname>Feng</surname><given-names>S</given-names> </name><name name-style="western"><surname>Feng</surname><given-names>H</given-names> </name><etal/></person-group><article-title>#WuhanDiary and #WuhanLockdown: gendered posting patterns and behaviours on Weibo during the COVID-19 pandemic</article-title><source>BMJ Glob Health</source><year>2022</year><month>04</month><volume>7</volume><issue>4</issue><fpage>e008149</fpage><pub-id pub-id-type="doi">10.1136/bmjgh-2021-008149</pub-id><pub-id pub-id-type="medline">35414567</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kouzy</surname><given-names>R</given-names> </name><name name-style="western"><surname>Abi Jaoude</surname><given-names>J</given-names> </name><name name-style="western"><surname>Kraitem</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Coronavirus goes viral: quantifying the COVID-19 misinformation epidemic on twitter</article-title><source>Cureus</source><year>2020</year><month>03</month><day>13</day><volume>12</volume><issue>3</issue><fpage>e7255</fpage><pub-id pub-id-type="doi">10.7759/cureus.7255</pub-id><pub-id pub-id-type="medline">32292669</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Llewellyn</surname><given-names>S</given-names> </name></person-group><article-title>Covid-19: how to be careful with trust and expertise on social media</article-title><source>BMJ</source><year>2020</year><month>03</month><day>25</day><volume>368</volume><fpage>m1160</fpage><pub-id pub-id-type="doi">10.1136/bmj.m1160</pub-id><pub-id pub-id-type="medline">32213480</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lenoir</surname><given-names>P</given-names> </name><name name-style="western"><surname>Moulahi</surname><given-names>B</given-names> </name><name name-style="western"><surname>Az&#x00E9;</surname><given-names>J</given-names> </name><name name-style="western"><surname>Bringay</surname><given-names>S</given-names> </name><name name-style="western"><surname>Mercier</surname><given-names>G</given-names> </name><name name-style="western"><surname>Carbonnel</surname><given-names>F</given-names> </name></person-group><article-title>Raising awareness about cervical cancer using twitter: content analysis of the 2015 #SmearForSmear campaign</article-title><source>J Med Internet Res</source><year>2017</year><month>10</month><day>16</day><volume>19</volume><issue>10</issue><fpage>e344</fpage><pub-id pub-id-type="doi">10.2196/jmir.8421</pub-id><pub-id pub-id-type="medline">29038096</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kummervold</surname><given-names>PE</given-names> </name><name name-style="western"><surname>Martin</surname><given-names>S</given-names> </name><name name-style="western"><surname>Dada</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Categorizing vaccine confidence with a transformer-based machine learning model: analysis of nuances of vaccine sentiment in twitter discourse</article-title><source>JMIR Med Inform</source><year>2021</year><month>10</month><day>8</day><volume>9</volume><issue>10</issue><fpage>e29584</fpage><pub-id pub-id-type="doi">10.2196/29584</pub-id><pub-id pub-id-type="medline">34623312</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="preprint"><person-group person-group-type="author"><name name-style="western"><surname>Sanh</surname><given-names>V</given-names> </name><name name-style="western"><surname>Debut</surname><given-names>L</given-names> </name><name name-style="western"><surname>Chaumond</surname><given-names>J</given-names> </name><name name-style="western"><surname>Wolf</surname><given-names>T</given-names> </name></person-group><article-title>DistilBERT, a distilled version of BERT: smaller, faster, cheaper and lighter</article-title><source>arXiv</source><comment>Preprint posted online on  Oct 2, 2019</comment><pub-id pub-id-type="doi">10.48550/arXiv.1910.01108</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="preprint"><person-group person-group-type="author"><name name-style="western"><surname>P&#x00E9;rez</surname><given-names>JM</given-names> </name><name name-style="western"><surname>Rajngewerc</surname><given-names>M</given-names> </name><name name-style="western"><surname>Giudici</surname><given-names>JC</given-names> </name><etal/></person-group><article-title>Pysentimiento: a python toolkit for opinion mining and social NLP tasks</article-title><source>arXiv</source><comment>Preprint posted online on  Jun 17, 2021</comment><pub-id pub-id-type="doi">10.48550/arXiv.2106.09462</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Loureiro</surname><given-names>D</given-names> </name><name name-style="western"><surname>Barbieri</surname><given-names>F</given-names> </name><name name-style="western"><surname>Neves</surname><given-names>L</given-names> </name><name name-style="western"><surname>Espinosa Anke</surname><given-names>L</given-names> </name><name name-style="western"><surname>Camacho-collados</surname><given-names>J</given-names> </name></person-group><article-title>TimeLMs: diachronic language models from twitter</article-title><conf-name>Proceedings of the 60th Annual Meeting of the Association for Computational Linguistics</conf-name><conf-date>May 22-27, 2022</conf-date><conf-loc>Dublin, Ireland</conf-loc><comment><ext-link ext-link-type="uri" xlink:href="https://aclanthology.org/2022.acl-demo">https://aclanthology.org/2022.acl-demo</ext-link></comment><pub-id pub-id-type="doi">10.18653/v1/2022.acl-demo.25</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Huilgol</surname><given-names>P</given-names> </name></person-group><article-title>Accuracy vs F1-score</article-title><source>Medium</source><year>2019</year><access-date>2025-03-07</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://medium.com/analytics-vidhya/accuracy-vs-f1-score-6258237beca2">https://medium.com/analytics-vidhya/accuracy-vs-f1-score-6258237beca2</ext-link></comment></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Kundu</surname><given-names>R</given-names> </name></person-group><article-title>F1 score in machine learning: intro &#x0026; calculation</article-title><source>V7labs</source><year>2022</year><access-date>2025-03-07</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.v7labs.com/blog/f1-score-guide">https://www.v7labs.com/blog/f1-score-guide</ext-link></comment></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cole-Lewis</surname><given-names>H</given-names> </name><name name-style="western"><surname>Pugatch</surname><given-names>J</given-names> </name><name name-style="western"><surname>Sanders</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Social listening: a content analysis of e-cigarette discussions on twitter</article-title><source>J Med Internet Res</source><year>2015</year><month>10</month><day>27</day><volume>17</volume><issue>10</issue><fpage>e243</fpage><pub-id pub-id-type="doi">10.2196/jmir.4969</pub-id><pub-id pub-id-type="medline">26508089</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hsieh</surname><given-names>HF</given-names> </name><name name-style="western"><surname>Shannon</surname><given-names>SE</given-names> </name></person-group><article-title>Three approaches to qualitative content analysis</article-title><source>Qual Health Res</source><year>2005</year><month>11</month><volume>15</volume><issue>9</issue><fpage>1277</fpage><lpage>1288</lpage><pub-id pub-id-type="doi">10.1177/1049732305276687</pub-id><pub-id pub-id-type="medline">16204405</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Schopf</surname><given-names>T</given-names> </name><name name-style="western"><surname>Braun</surname><given-names>D</given-names> </name><name name-style="western"><surname>Matthes</surname><given-names>F</given-names> </name></person-group><article-title>Semantic label representations with lbl2vec: a similarity-based approach for unsupervised text classification</article-title><source>Web Information Systems and Technologies</source><year>2023</year><publisher-name>Springer, Cham</publisher-name><fpage>59</fpage><lpage>73</lpage><pub-id pub-id-type="doi">10.1007/978-3-031-24197-0_4</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Eldallal</surname><given-names>A</given-names> </name><name name-style="western"><surname>Barbu</surname><given-names>E</given-names> </name></person-group><article-title>BibRank: automatic keyphrase extraction platform using metadata</article-title><source>Information</source><year>2023</year><volume>14</volume><issue>10</issue><fpage>549</fpage><pub-id pub-id-type="doi">10.3390/info14100549</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gough</surname><given-names>A</given-names> </name><name name-style="western"><surname>Hunter</surname><given-names>RF</given-names> </name><name name-style="western"><surname>Ajao</surname><given-names>O</given-names> </name><etal/></person-group><article-title>Tweet for behavior change: using social media for the dissemination of public health messages</article-title><source>JMIR Public Health Surveill</source><year>2017</year><month>03</month><day>23</day><volume>3</volume><issue>1</issue><fpage>e14</fpage><pub-id pub-id-type="doi">10.2196/publichealth.6313</pub-id><pub-id pub-id-type="medline">28336503</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Semiz</surname><given-names>G</given-names> </name><name name-style="western"><surname>Berger</surname><given-names>PD</given-names> </name></person-group><article-title>Determining the factors that drive twitter engagement-rates</article-title><source>ABR</source><year>2017</year><volume>5</volume><issue>2</issue><comment><ext-link ext-link-type="uri" xlink:href="http://scholarpublishing.org/index.php/ABR/issue/view/135">http://scholarpublishing.org/index.php/ABR/issue/view/135</ext-link></comment><pub-id pub-id-type="doi">10.14738/abr.52.2700</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Katie Sehl</surname><given-names>KM</given-names> </name></person-group><article-title>Engagement rate calculator</article-title><source>IndiKit</source><year>2024</year><access-date>2025-03-07</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.indikit.net/document/371-engagement-rate-calculator">https://www.indikit.net/document/371-engagement-rate-calculator</ext-link></comment></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Voorveld</surname><given-names>HAM</given-names> </name><name name-style="western"><surname>van Noort</surname><given-names>G</given-names> </name><name name-style="western"><surname>Muntinga</surname><given-names>DG</given-names> </name><name name-style="western"><surname>Bronner</surname><given-names>F</given-names> </name></person-group><article-title>Engagement with social media and social media advertising: the differentiating role of platform type</article-title><source>J Advert</source><year>2018</year><month>01</month><day>2</day><volume>47</volume><issue>1</issue><fpage>38</fpage><lpage>54</lpage><pub-id pub-id-type="doi">10.1080/00913367.2017.1405754</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Melton</surname><given-names>CA</given-names> </name><name name-style="western"><surname>White</surname><given-names>BM</given-names> </name><name name-style="western"><surname>Davis</surname><given-names>RL</given-names> </name><name name-style="western"><surname>Bednarczyk</surname><given-names>RA</given-names> </name><name name-style="western"><surname>Shaban-Nejad</surname><given-names>A</given-names> </name></person-group><article-title>Fine-tuned sentiment analysis of COVID-19 vaccine-related social media data: comparative study</article-title><source>J Med Internet Res</source><year>2022</year><month>10</month><day>17</day><volume>24</volume><issue>10</issue><fpage>e40408</fpage><pub-id pub-id-type="doi">10.2196/40408</pub-id><pub-id pub-id-type="medline">36174192</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Latkin</surname><given-names>CA</given-names> </name><name name-style="western"><surname>Dayton</surname><given-names>L</given-names> </name><name name-style="western"><surname>Miller</surname><given-names>JR</given-names> </name><etal/></person-group><article-title>Behavioral and attitudinal correlates of trusted sources of COVID-19 vaccine information in the US</article-title><source>Behav Sci (Basel)</source><year>2021</year><month>04</month><day>20</day><volume>11</volume><issue>4</issue><fpage>56</fpage><pub-id pub-id-type="doi">10.3390/bs11040056</pub-id><pub-id pub-id-type="medline">33924118</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jucks</surname><given-names>R</given-names> </name><name name-style="western"><surname>Thon</surname><given-names>FM</given-names> </name></person-group><article-title>Better to have many opinions than one from an expert? Social validation by one trustworthy source versus the masses in online health forums</article-title><source>Comput Human Behav</source><year>2017</year><month>05</month><volume>70</volume><fpage>375</fpage><lpage>381</lpage><pub-id pub-id-type="doi">10.1016/j.chb.2017.01.019</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>X</given-names> </name></person-group><article-title>Online health communities influence people&#x2019;s health behaviors in the context of COVID-19</article-title><source>PLOS ONE</source><year>2023</year><volume>18</volume><issue>4</issue><fpage>e0282368</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0282368</pub-id><pub-id pub-id-type="medline">37053287</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lustria</surname><given-names>MLA</given-names> </name><name name-style="western"><surname>Noar</surname><given-names>SM</given-names> </name><name name-style="western"><surname>Cortese</surname><given-names>J</given-names> </name><name name-style="western"><surname>Van Stee</surname><given-names>SK</given-names> </name><name name-style="western"><surname>Glueckauf</surname><given-names>RL</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>J</given-names> </name></person-group><article-title>A meta-analysis of web-delivered tailored health behavior change interventions</article-title><source>J Health Commun</source><year>2013</year><volume>18</volume><issue>9</issue><fpage>1039</fpage><lpage>1069</lpage><pub-id pub-id-type="doi">10.1080/10810730.2013.768727</pub-id><pub-id pub-id-type="medline">23750972</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Maibach</surname><given-names>EW</given-names> </name></person-group><person-group person-group-type="editor"><name name-style="western"><surname>Parrott</surname><given-names>RL</given-names> </name></person-group><source>Designing Health Messages: Approaches from Communication Theory and Public Health Practice</source><year>1995</year><publisher-name>SAGE Publication</publisher-name><pub-id pub-id-type="doi">10.4135/9781452233451</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lutkenhaus</surname><given-names>RO</given-names> </name><name name-style="western"><surname>Jansz</surname><given-names>J</given-names> </name><name name-style="western"><surname>Bouman</surname><given-names>MP</given-names> </name></person-group><article-title>Tailoring in the digital era: Stimulating dialogues on health topics in collaboration with social media influencers</article-title><source>Digit Health</source><year>2019</year><volume>5</volume><fpage>2055207618821521</fpage><pub-id pub-id-type="doi">10.1177/2055207618821521</pub-id><pub-id pub-id-type="medline">30729023</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Xue</surname><given-names>J</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>J</given-names> </name><name name-style="western"><surname>Hu</surname><given-names>R</given-names> </name><etal/></person-group><article-title>Twitter discussions and emotions about the COVID-19 pandemic: machine learning approach</article-title><source>J Med Internet Res</source><year>2020</year><month>11</month><day>25</day><volume>22</volume><issue>11</issue><fpage>e20550</fpage><pub-id pub-id-type="doi">10.2196/20550</pub-id><pub-id pub-id-type="medline">33119535</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Xue</surname><given-names>J</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>J</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>C</given-names> </name><name name-style="western"><surname>Zheng</surname><given-names>C</given-names> </name><name name-style="western"><surname>Li</surname><given-names>S</given-names> </name><name name-style="western"><surname>Zhu</surname><given-names>T</given-names> </name></person-group><article-title>Public discourse and sentiment during the COVID 19 pandemic: Using Latent Dirichlet Allocation for topic modeling on Twitter</article-title><source>PLoS ONE</source><year>2020</year><volume>15</volume><issue>9</issue><fpage>e0239441</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0239441</pub-id><pub-id pub-id-type="medline">32976519</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Boon-Itt</surname><given-names>S</given-names> </name><name name-style="western"><surname>Skunkan</surname><given-names>Y</given-names> </name></person-group><article-title>Public perception of the COVID-19 pandemic on Twitter: sentiment analysis and topic modeling study</article-title><source>JMIR Public Health Surveill</source><year>2020</year><month>11</month><day>11</day><volume>6</volume><issue>4</issue><fpage>e21978</fpage><pub-id pub-id-type="doi">10.2196/21978</pub-id><pub-id pub-id-type="medline">33108310</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Worrall</surname><given-names>AP</given-names> </name><name name-style="western"><surname>Kelly</surname><given-names>C</given-names> </name><name name-style="western"><surname>O&#x2019;Neill</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Online search trends influencing anticoagulation in patients with COVID-19: observational study</article-title><source>JMIR Form Res</source><year>2021</year><month>08</month><day>31</day><volume>5</volume><issue>8</issue><fpage>e21817</fpage><pub-id pub-id-type="doi">10.2196/21817</pub-id><pub-id pub-id-type="medline">34292865</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>S</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>J</given-names> </name></person-group><article-title>Understanding behavioral intentions toward COVID-19 vaccines: theory-based content analysis of tweets</article-title><source>J Med Internet Res</source><year>2021</year><month>05</month><day>12</day><volume>23</volume><issue>5</issue><fpage>e28118</fpage><pub-id pub-id-type="doi">10.2196/28118</pub-id><pub-id pub-id-type="medline">33939625</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hussain</surname><given-names>A</given-names> </name><name name-style="western"><surname>Tahir</surname><given-names>A</given-names> </name><name name-style="western"><surname>Hussain</surname><given-names>Z</given-names> </name><etal/></person-group><article-title>Artificial intelligence-enabled analysis of public attitudes on Facebook and Twitter toward COVID-19 vaccines in the United Kingdom and the United States: observational study</article-title><source>J Med Internet Res</source><year>2021</year><month>04</month><day>5</day><volume>23</volume><issue>4</issue><fpage>e26627</fpage><pub-id pub-id-type="doi">10.2196/26627</pub-id><pub-id pub-id-type="medline">33724919</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lyu</surname><given-names>JC</given-names> </name><name name-style="western"><surname>Han</surname><given-names>EL</given-names> </name><name name-style="western"><surname>Luli</surname><given-names>GK</given-names> </name></person-group><article-title>COVID-19 vaccine-related discussion on twitter: topic modeling and sentiment analysis</article-title><source>J Med Internet Res</source><year>2021</year><month>06</month><day>29</day><volume>23</volume><issue>6</issue><fpage>e24435</fpage><pub-id pub-id-type="doi">10.2196/24435</pub-id><pub-id pub-id-type="medline">34115608</pub-id></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Berg</surname><given-names>SH</given-names> </name><name name-style="western"><surname>O&#x2019;Hara</surname><given-names>JK</given-names> </name><name name-style="western"><surname>Shortt</surname><given-names>MT</given-names> </name><etal/></person-group><article-title>Health authorities&#x2019; health risk communication with the public during pandemics: a rapid scoping review</article-title><source>BMC Public Health</source><year>2021</year><month>07</month><day>15</day><volume>21</volume><issue>1</issue><fpage>1401</fpage><pub-id pub-id-type="doi">10.1186/s12889-021-11468-3</pub-id><pub-id pub-id-type="medline">34266403</pub-id></nlm-citation></ref><ref id="ref44"><label>44</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pattison</surname><given-names>AB</given-names> </name><name name-style="western"><surname>Reinfelde</surname><given-names>M</given-names> </name><name name-style="western"><surname>Chang</surname><given-names>H</given-names> </name><etal/></person-group><article-title>Finding the facts in an infodemic: framing effective COVID-19 messages to connect people to authoritative content</article-title><source>BMJ Glob Health</source><year>2022</year><month>02</month><volume>7</volume><issue>2</issue><fpage>e007582</fpage><pub-id pub-id-type="doi">10.1136/bmjgh-2021-007582</pub-id><pub-id pub-id-type="medline">35131808</pub-id></nlm-citation></ref><ref id="ref45"><label>45</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pakhtigian</surname><given-names>EL</given-names> </name><name name-style="western"><surname>Downs-Tepper</surname><given-names>H</given-names> </name><name name-style="western"><surname>Anson</surname><given-names>A</given-names> </name><name name-style="western"><surname>Pattanayak</surname><given-names>SK</given-names> </name></person-group><article-title>COVID-19, public health messaging, and sanitation and hygiene practices in rural India</article-title><source>J Water Sanit Hyg Dev</source><year>2022</year><month>11</month><day>1</day><volume>12</volume><issue>11</issue><fpage>828</fpage><lpage>837</lpage><pub-id pub-id-type="doi">10.2166/washdev.2022.134</pub-id></nlm-citation></ref><ref id="ref46"><label>46</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Officer</surname><given-names>TN</given-names> </name><name name-style="western"><surname>McKinlay</surname><given-names>E</given-names> </name><name name-style="western"><surname>Imlach</surname><given-names>F</given-names> </name><name name-style="western"><surname>Kennedy</surname><given-names>J</given-names> </name><name name-style="western"><surname>Churchward</surname><given-names>M</given-names> </name><name name-style="western"><surname>McBride-Henry</surname><given-names>K</given-names> </name></person-group><article-title>Experiences of New Zealand public health messaging while in lockdown</article-title><source>Aust N Z J Public Health</source><year>2022</year><month>12</month><volume>46</volume><issue>6</issue><fpage>735</fpage><lpage>737</lpage><pub-id pub-id-type="doi">10.1111/1753-6405.13297</pub-id><pub-id pub-id-type="medline">36190208</pub-id></nlm-citation></ref><ref id="ref47"><label>47</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Abuhashesh</surname><given-names>MY</given-names> </name><name name-style="western"><surname>Al-Dmour</surname><given-names>H</given-names> </name><name name-style="western"><surname>Masa&#x2019;deh</surname><given-names>R</given-names> </name><etal/></person-group><article-title>The role of social media in raising public health awareness during the pandemic COVID-19: an international comparative study</article-title><source>Informatics (MDPI)</source><year>2021</year><volume>8</volume><issue>4</issue><fpage>80</fpage><pub-id pub-id-type="doi">10.3390/informatics8040080</pub-id></nlm-citation></ref><ref id="ref48"><label>48</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Karmegam</surname><given-names>D</given-names> </name><name name-style="western"><surname>Mapillairaju</surname><given-names>B</given-names> </name></person-group><article-title>What people share about the COVID-19 outbreak on Twitter? An exploratory analysis</article-title><source>BMJ Health Care Inform</source><year>2020</year><month>11</month><volume>27</volume><issue>3</issue><fpage>e100133</fpage><pub-id pub-id-type="doi">10.1136/bmjhci-2020-100133</pub-id><pub-id pub-id-type="medline">33214193</pub-id></nlm-citation></ref><ref id="ref49"><label>49</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Slavik</surname><given-names>CE</given-names> </name><name name-style="western"><surname>Buttle</surname><given-names>C</given-names> </name><name name-style="western"><surname>Sturrock</surname><given-names>SL</given-names> </name><name name-style="western"><surname>Darlington</surname><given-names>JC</given-names> </name><name name-style="western"><surname>Yiannakoulias</surname><given-names>N</given-names> </name></person-group><article-title>Examining tweet content and engagement of Canadian public health agencies and decision makers during COVID-19: mixed methods analysis</article-title><source>J Med Internet Res</source><year>2021</year><month>03</month><day>11</day><volume>23</volume><issue>3</issue><fpage>e24883</fpage><pub-id pub-id-type="doi">10.2196/24883</pub-id><pub-id pub-id-type="medline">33651705</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Sentiment analysis.</p><media xlink:href="formative_v9i1e59687_app1.xlsx" xlink:title="XLSX File, 44 KB"/></supplementary-material><supplementary-material id="app2"><label>Multimedia Appendix 2</label><p>User classification.</p><media xlink:href="formative_v9i1e59687_app2.xlsx" xlink:title="XLSX File, 89 KB"/></supplementary-material><supplementary-material id="app3"><label>Multimedia Appendix 3</label><p>Message classification.</p><media xlink:href="formative_v9i1e59687_app3.xlsx" xlink:title="XLSX File, 80 KB"/></supplementary-material><supplementary-material id="app4"><label>Multimedia Appendix 4</label><p>Results of zero-inflated model.</p><media xlink:href="formative_v9i1e59687_app4.xlsx" xlink:title="XLSX File, 11 KB"/></supplementary-material><supplementary-material id="app5"><label>Checklist 1</label><p>STROBE checklist for cross-sectional studies.</p><media xlink:href="formative_v9i1e59687_app5.doc" xlink:title="DOC File, 94 KB"/></supplementary-material></app-group></back></article>