<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Form Res</journal-id><journal-id journal-id-type="publisher-id">formative</journal-id><journal-id journal-id-type="index">27</journal-id><journal-title>JMIR Formative Research</journal-title><abbrev-journal-title>JMIR Form Res</abbrev-journal-title><issn pub-type="epub">2561-326X</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v9i1e66237</article-id><article-id pub-id-type="doi">10.2196/66237</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Surveillance of Twitter Data on COVID-19 Symptoms During the Omicron Variant Period: A Sentiment Analysis</article-title></title-group><contrib-group><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Zhang</surname><given-names>Kaiyue</given-names></name><degrees>BS, MPH</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Guo</surname><given-names>Zhaojin</given-names></name><degrees>BS, MPH</degrees><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Ai</surname><given-names>Yujie</given-names></name><degrees>BEng, MSc</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="aff" rid="aff4">4</xref><xref ref-type="aff" rid="aff5">5</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Li</surname><given-names>An-Ran</given-names></name><degrees>BS, MPH</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Li</surname><given-names>Anlin</given-names></name><degrees>BS,MSc</degrees><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="aff" rid="aff6">6</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Liu</surname><given-names>Ziyu</given-names></name><degrees>MSc</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Tse</surname><given-names>Yittie Yi Ting</given-names></name><degrees>MSc, MPH</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff5">5</xref><xref ref-type="aff" rid="aff7">7</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Zhou</surname><given-names>Xinyu</given-names></name><degrees>BS, MPH</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Liu</surname><given-names>Taoran</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Xiong</surname><given-names>Chuxi</given-names></name><degrees>BSc</degrees><xref ref-type="aff" rid="aff8">8</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Huang</surname><given-names>Jian</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff9">9</xref><xref ref-type="aff" rid="aff10">10</xref><xref ref-type="aff" rid="aff11">11</xref></contrib><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Ming</surname><given-names>Wai-kit</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="aff" rid="aff12">12</xref></contrib></contrib-group><aff id="aff1"><institution>School of Public Health, Li Ka Shing Faculty of Medicine, University of Hong Kong</institution><addr-line>Hong Kong</addr-line><country>China (Hong Kong)</country></aff><aff id="aff2"><institution>Department of Paediatrics and Adolescent Medicine, School of Clinical Medicine, University of Hong Kong</institution><addr-line>Hong Kong</addr-line><country>China (Hong Kong)</country></aff><aff id="aff3"><institution>Department of Infectious Diseases and Public Health, Jockey Club College of Veterinary Medicine and Life Sciences, City University of Hong Kong</institution><addr-line>To Yuen Building, 31 To Yuen Street</addr-line><addr-line>Hong Kong</addr-line><country>China (Hong Kong)</country></aff><aff id="aff4"><institution>Department of Family Medicine and Primary Care, Li Ka Shing Faculty of Medicine, School of Clinical Medicine, University of Hong Kong</institution><addr-line>Hong Kong</addr-line><country>China (Hong Kong)</country></aff><aff id="aff5"><institution>Department of Pharmacology and Pharmacy, Li Ka Shing Faculty of Medicine, University of Hong Kong</institution><addr-line>Hong Kong</addr-line><country>China (Hong Kong)</country></aff><aff id="aff6"><institution>Department of Medical Record, Peking University Third Hospital</institution><addr-line>Beijing</addr-line><country>China</country></aff><aff id="aff7"><institution>Department of Health, The Government of the Hong Kong Special Administrative Region</institution><addr-line>Hong Kong</addr-line><country>China (Hong Kong)</country></aff><aff id="aff8"><institution>Department of Science, University of Waterloo</institution><addr-line>Waterloo</addr-line><addr-line>ON</addr-line><country>Canada</country></aff><aff id="aff9"><institution>Institute for Human Development and Potential (IHDP), ASTAR</institution><addr-line>Singapore</addr-line><country>Singapore</country></aff><aff id="aff10"><institution>Bioinformatics Institute (BII), ASTAR</institution><addr-line>Singapore</addr-line><country>Singapore</country></aff><aff id="aff11"><institution>Human Potential Translational Research Programme, National University of Singapore</institution><addr-line>Singapore</addr-line><country>Singapore</country></aff><aff id="aff12"><institution>Institute of Global Governance and Innovation for a Shared Future, City University of Hong Kong</institution><addr-line>Hong Kong</addr-line><country>China (Hong Kong)</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Mavragani</surname><given-names>Amaryllis</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Jarynowski</surname><given-names>Andrzej</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Wai-kit Ming, PhD, Department of Infectious Diseases and Public Health, Jockey Club College of Veterinary Medicine and Life Sciences, City University of Hong Kong, To Yuen Building, 31 To Yuen Street, Hong Kong, China (Hong Kong), 852 34426956; <email>wkming2@cityu.edu.hk</email></corresp><fn fn-type="equal" id="equal-contrib1"><label>*</label><p>these authors contributed equally</p></fn></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>23</day><month>9</month><year>2025</year></pub-date><volume>9</volume><elocation-id>e66237</elocation-id><history><date date-type="received"><day>07</day><month>09</month><year>2024</year></date><date date-type="rev-recd"><day>17</day><month>06</month><year>2025</year></date><date date-type="accepted"><day>27</day><month>06</month><year>2025</year></date></history><copyright-statement>&#x00A9; Kaiyue Zhang, Zhaojin Guo, Yujie Ai, An-Ran Li, Anlin Li, Ziyu Liu, Yittie Yi Ting Tse, Xinyu Zhou, Taoran Liu, Chuxi Xiong, Jian Huang, Wai-kit Ming. Originally published in JMIR Formative Research (<ext-link ext-link-type="uri" xlink:href="https://formative.jmir.org">https://formative.jmir.org</ext-link>), 23.9.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Formative Research, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://formative.jmir.org">https://formative.jmir.org</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://formative.jmir.org/2025/1/e66237"/><abstract><sec><title>Background</title><p>The global outbreak of COVID-19 has significantly impacted health care systems and has necessitated timely access to information for effective decision-making by health care authorities. Conventional methods for collecting patient data and analyzing virus mutations are resource-intensive. In the current era of rapid internet development, information on COVID-19 infections could be collected by a novel approach that leverages social media, particularly Twitter (subsequently rebranded X).</p></sec><sec><title>Objective</title><p>The aim of this study was to analyze the trending patterns of tweets containing information about various COVID-19 symptoms, explore their synchronization and correlation with conventional monitoring data, and provide insights into the evolution of the virus. We categorized tweet sentiments to understand the predictive power of negative emotions of different symptoms in anticipating the emergence of new Omicron subvariants and offering real-time assistance to affected individuals.</p></sec><sec sec-type="methods"><title>Methods</title><p>Relevant user tweets from 2022 containing information about COVID-19 symptoms were extracted from Twitter. Our fine-tuned RoBERTa model for sentiment analysis, achieving 99.7% accuracy for sentiment analysis, was used to categorize tweets as negative, positive, or neutral. Joinpoint regression analysis was used to examine the trends in weekly negative tweets related to COVID-19 symptoms, aligning these trends with the transition periods of SARS-CoV-2 Omicron subvariants from 2022. Real-time Twitter users with negative sentiments were geographically plotted. A total of 105,934 tweets related to fever, 120,257 to cough, 55,790 to headache, 101,220 to sore throat, 3410 to vomiting, and 5913 to diarrhea were collected.</p></sec><sec sec-type="results"><title>Results</title><p>The most prominent topics of discussion were fever, sore throat, and headache. The weekly average daily tweets exhibited different fluctuation patterns in different stages of subvariants. Specifically, fever-related negative tweets were more sensitive to Omicron subvariant evolution, while discussions of other symptoms declined and stabilized following the emergence of the BA.2 variant. Negative discussions about fever rose to nearly 40% at the beginning of 2022 and showed 2 distinct peaks during the absolute dominance of BA.2 and BA.5, respectively. Headache and throat-related negative sentiment exhibited the highest levels among the analyzed symptoms. Tweets containing geographic information accounted for 1.5% (1351/391,508) of all collected data, with negative sentiment users making up 0.35% (5873/391,508) of all related tweets.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>This study underscores the potential of using social media, particularly tweet trends, for real-time analysis of COVID-19 infections and has demonstrated correlations with major symptoms. The degree of negative emotions expressed in tweets is valuable in predicting the emergence of new Omicron subvariants of COVID-19 and facilitating the provision of timely assistance to affected individuals.</p></sec></abstract><kwd-group><kwd>COVID-19</kwd><kwd>social media surveillance</kwd><kwd>Twitter</kwd><kwd>natural language processing</kwd><kwd>real-time analysis</kwd><kwd>sentiment analysis</kwd><kwd>virus mutations</kwd><kwd>geographic tracking</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Symptom surveillance is crucial for public health and monitoring the transmission dynamics of infectious diseases [<xref ref-type="bibr" rid="ref1">1</xref>]. Surveillance involves indicator-based and event-based surveillance [<xref ref-type="bibr" rid="ref2">2</xref>], of which the former uses established protocols to collect structured data based on correlations between cases and hospital diagnostic data. Currently, the identification and variation of virus symptoms are studied in large populations in hospitals. However, delays in testing and reporting among institutions impact the timeliness of decision-making, hinder the prompt mobilization of resources and public education after determining the symptoms of mutated viruses, and potentially lead to losses and public panic [<xref ref-type="bibr" rid="ref3">3</xref>].</p><p>Event-based surveillance can be performed using nonconventional data sources, such as social media, news, and public health networks, and excels in the timely identification of emerging public health issues. There is a trend of growing reliance on social media and search engines for pandemic-related data collection. Health systems are integrating conventional and advanced techniques to obtain more immediate and comprehensive data, which enhances the formulation of health policy.</p><p>Since the H1N1 influenza epidemic in 2009, social media has started to play a pivotal role in surveillance. For instance, HealthMap combines formal sources such as the World Health Organization (WHO) and the Centers for Disease Control and Prevention (CDC) with informal data sources such as Twitter to reduce reporting delays [<xref ref-type="bibr" rid="ref4">4</xref>]. A study on the 2010 cholera outbreak in Haiti assessed the correlation between unofficial data sources (eg, HealthMap and Twitter) and government-reported cases. The effective reproduction number was also estimated using these nonofficial sources [<xref ref-type="bibr" rid="ref5">5</xref>]. Twitter has also been applied to monitor dengue fever in analyses focusing on various aspects of tweets to identify potential cases [<xref ref-type="bibr" rid="ref6">6</xref>], especially sociodemographic characteristics [<xref ref-type="bibr" rid="ref7">7</xref>].</p><p>Social media surveillance has continued to progress for other infectious diseases, including Ebola [<xref ref-type="bibr" rid="ref8">8</xref>], Middle East respiratory syndrome [<xref ref-type="bibr" rid="ref9">9</xref>], and Zika [<xref ref-type="bibr" rid="ref10">10</xref>]. Retrospective prediction models based on Google and Twitter data have demonstrated potential in the early detection of suspected Zika cases [<xref ref-type="bibr" rid="ref10">10</xref>]. In the era of the COVID-19 pandemic, research has shifted focus toward understanding risk factors for the disease [<xref ref-type="bibr" rid="ref11">11</xref>], its symptoms and mental health impacts [<xref ref-type="bibr" rid="ref12">12</xref>], and using sentiment analysis to combat the spread of misinformation [<xref ref-type="bibr" rid="ref13">13</xref>]. Mackey et al [<xref ref-type="bibr" rid="ref14">14</xref>] used machine learning to identify COVID-19 symptoms and related experiences from Twitter, highlighting testing challenges and underreporting issues. A recurrent neural network has also been used to classify sentiment and analyze manifestations [<xref ref-type="bibr" rid="ref15">15</xref>].</p><p>Wu et al [<xref ref-type="bibr" rid="ref16">16</xref>] demonstrated the dynamic changes of COVID-19 symptoms over time, from the early typical respiratory symptoms to the later musculoskeletal and nervous system symptoms. We propose a Twitter-based symptom surveillance method for COVID-19 infections focusing on 6 typical symptoms. We chose Twitter (subsequently rebranded as X) as a data source to collect public information on people with COVID-19 from 2022. A previous study collected a large number of tweets related to the Omicron variant and classified them based on sentiment, language, source, and type of tweet, among other aspects [<xref ref-type="bibr" rid="ref17">17</xref>]. We also analyzed the sentiment of their tweets to determine the severity of the impact for each individual. Our model can detect the emotions of users with COVID-19 on a geographic map in real time. This method monitors the dynamic epidemiological situation, especially the evolution of symptoms of Omicron subvariants, and explores correlations with public sentiment. The findings could assist in making timely governmental decisions for strengthening pandemic prevention and control.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Overview</title><p>This study used quantitative and qualitative methods for collecting and analyzing tweets related to COVID-19 to synchronize, forecast, and track the evolution of the different COVID-19 symptoms. The focus was on symptoms, the emotions of those who have been infected, and geographical information. We identified tweets related to COVID-19 symptoms as our key search criterion and collected tweets containing any reference to the occurrence of the disease and its symptoms from January 1, 2022, to December 31, 2022. The data were prepared in 3 steps: (1) data selection, (2) data collection, and (3) data cleaning.</p></sec><sec id="s2-2"><title>Data Selection</title><p>We collected tweets related to COVID-19 symptoms using the following key search terms: &#x201C;fever,&#x201D; &#x201C;cough,&#x201D; &#x201C;headache,&#x201D; &#x201C;throat,&#x201D; and &#x201C;vomit,&#x201D; which are related to common symptoms of COVID-19 according to the CDC in October 2022 [<xref ref-type="bibr" rid="ref18">18</xref>]. We collected data if any of these terms and the term &#x201C;COVID&#x201D; appeared in a published tweet. We chose daily Twitter data from 2022 because of its higher maturity in test technologies and monitoring systems, which supported the meaningful comparison between Twitter data and clinical data.</p></sec><sec id="s2-3"><title>Data Collection</title><p>During the data collection phase, daily tweets in English were gathered from Twitter using Python scripts. The advanced search function on Twitter was used to extract comprehensive datasets, followed by a data-validation process to maintain collection accuracy. Additional data crawling was conducted to reinforce the integrity of the dataset. Official numbers of weekly confirmed cases were reported by the WHO [<xref ref-type="bibr" rid="ref19">19</xref>]. We used 3 continuous modules to analyze COVID-19 symptoms for the real-time surveillance of people infected with COVID-19: temporal analysis, sentiment analysis, and user-feature analysis.</p></sec><sec id="s2-4"><title>Sentiment Analysis</title><p>After data collection, we preprocessed the data of each tweet using Python (Python Software Foundation) and R (The R Foundation), which filtered out tweets with significant amounts of garbled characters before inputting them into the sentiment analysis model. The sentiments expressed in short tweets are generally more direct, which makes it easier to determine the sentiment category. To accurately determine their sentiment, both training and inference were conducted on all tweets using the latest natural language processing (NLP) model, the RoBERTa base model [<xref ref-type="bibr" rid="ref20">20</xref>], in the Hugging Face repository.</p><p>We identified the tweets of users who were infected with COVID-19, predicted the probability of different types of emotions in each tweet (positive, neutral, and negative), and selected the category with the highest probability as the sentiment result. We used Omicron subvariants data from the weekly epidemiology reports of the WHO to create a geographical map of Omicron subvariants&#x2019; proportions over 1 year. The WHO data are obtained through geographical coverage and align with our worldwide Twitter data. The accuracy of sentiment analysis for the 3 categories was 99.7%.</p><p>We performed a joinpoint regression to analyze changes in counts of weekly negative tweets. The subvariant transition periods are set as the week during which a new Omicron subvariant replaces the previous subvariant, plus 1 week before and after. We aim to identify whether the significant joinpoints captured by the joinpoint regression fall within these subvariant transition periods.</p></sec><sec id="s2-5"><title>Geographical Analysis</title><p>In the completed map, each red dot represents a tweet related to COVID-19 symptoms. Geographic information about Twitter users is obtained by using the Twitter API to see what geographic information exists, or by analyzing metadata or tweets to infer geographic information. The map provides a quick display of the daily count of negative tweets and the tally of tweets concerning COVID-19 in a specific region while summarizing the negative, positive, and neutral sentiments. A line graph shows the fluctuations in the quantity of COVID-19&#x2013;related tweets regionally over time.</p></sec><sec id="s2-6"><title>Ethical Considerations</title><p>This study did not involve human participants or interventions, and thus no informed consent was required. The analysis relied solely on publicly available Twitter data, ensuring the anonymity of individuals. Any personal information collected was handled in accordance with ethical guidelines, and no identifiable user data are disclosed in this paper.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Real-Time Analysis of Tweets Related to COVID-19 Symptoms From 2022</title><p>The collected data encompassed 6 symptoms mentioned in tweets, of which 105,934 tweets were related to fever, 120,257 were related to cough, 55,790 were related to headache, 101,220 were related to sore throat, 3410 were related to vomiting, and 5913 were related to diarrhea (<xref ref-type="fig" rid="figure1">Figure 1</xref>).</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>A flowchart of screening for COVID-19 symptom&#x2013;related tweets. NLP: natural language processing; WHO: World Health Organization.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v9i1e66237_fig01.png"/></fig><p><xref ref-type="fig" rid="figure2">Figure 2</xref> shows the trend of the weekly ratio of symptom-related tweets and new cases of COVID-19 worldwide. We divided the year 2022 into 4 periods based on the prevalence of different variants. There were 4 peaks in the number of new cases throughout the year, which occurred in January, March, July, and December. Furthermore, the fluctuations in ratios of weekly symptom tweets demonstrated a certain level of synchronous pattern with the evolution of Omicron variants and waves of new cases.</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Weekly average severity of daily tweets about symptoms and confirmed cases.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v9i1e66237_fig02.png"/></fig><p>According to the gathered symptom surveillance data, discussions surrounding fever, sore throat, and headache were the most prominent, which was consistent with real-world observations. Fever was common from the beginning of the pandemic, whereas sore throat and headache became more prevalent during the Omicron period [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref22">22</xref>] and attracted increased attention from multiple public health authorities [<xref ref-type="bibr" rid="ref23">23</xref>].</p><p>In <xref ref-type="fig" rid="figure2">Figure 2</xref>, the periods of analysis are as follows: (1) period 1 (January 1-February 20): dominance of BA.1 and BA.1.1, (2) period 2 (February 20-June 12): BA.2 dominance, (3) period 3 (June 12-December 1): BA.5 dominance, and (4) period 4 (December 1-12): BQ1 and XBB dominance. The weekly average of daily symptom severity is the calculated number of tweets for each symptom as a proportion of tweets for all symptoms. Gray shaded area: weekly confirmed cases from the WHO. To match the 2 values of the vertical axis (weekly average daily), we performed vertical axis matching to display the image.</p><p>The confirmed cases (<xref ref-type="fig" rid="figure2">Figure 2</xref>, gray shaded area) increased only in the first 2 weeks during period 1 and then continued to decrease because this period was in the later stages of the dominance of the BA.1 and BA.1.1 subvariants. Restrictions on travel and activities and vaccination measures were implemented as early as November-December 2021. Correspondingly, the tweets related to all symptoms demonstrated a decreasing trend with little difference among them.</p><p>During period 2, the BA.2 subvariant emerged as the dominant strain and superseded BA.1 and BA.1.1. Although the increased transmissibility of BA.2 [<xref ref-type="bibr" rid="ref24">24</xref>] contributed to a second peak in confirmed cases, the risk of reinfection with BA.2 was lower [<xref ref-type="bibr" rid="ref24">24</xref>], and the severity did not escalate compared to earlier periods. Consequently, there were some slight fluctuations in Twitter discussions. At the same time, tweets related to sore throat, fever, and headache began to dominate during this period.</p><p>By mid-2022, in period 3, the symptom surveillance data showed a peak that corresponds to a surge in new cases in the real world, particularly in terms of fever, throat discomfort, and headache. Tweets related to other symptoms also exhibited relatively elevated peaks compared to their baseline levels. During this period, the BA.5 subvariant swiftly supplanted BA.2 as the predominant strain. Notably, BA.5 was characterized by enhanced immunity and heightened transmissibility [<xref ref-type="bibr" rid="ref25">25</xref>-<xref ref-type="bibr" rid="ref28">28</xref>].</p><p>Some research indicates that individuals infected with the BA.5 subvariant are more prone to experiencing several common symptoms that we have selected [<xref ref-type="bibr" rid="ref29">29</xref>], which reinforces the robustness of our analysis. Heightened public sensitivity on social media outpaced the actual occurrence of the disease and may have been influenced by sore throats becoming a primary symptom and growing awareness of the Omicron subvariants. The dynamic interplay between subvariant characteristics and public discourse is evident.</p><p>In period 4, the BQ1 subvariant dominated, which was accompanied by the emergence of XBB. Research indicates that BQ.1 and XBB have higher effective reproduction numbers [<xref ref-type="bibr" rid="ref30">30</xref>] and transmissibility compared to BA.2 and BA.5 [<xref ref-type="bibr" rid="ref31">31</xref>]. A peak of newly reported cases in December 2022 occurred in the week of December 5-11 and reached its highest point in the week of December 19-25. The Twitter data promptly revealed this conspicuous peak, and the top 3 most discussed symptoms were more sensitive.</p></sec><sec id="s3-2"><title>Sentiment Analysis of Tweets Related to COVID-19 Symptoms From 2022</title><p>Among the 8 subvariants, BA.1, BA.1.1, BA.2, BA.5, and BQ.1 notably dominated at various points during 2022. At the beginning of the year, BA.1 had already started to be gradually replaced by BA.1.1, but BA.2 quickly emerged and maintained a proportion greater than 50% for an extended period of 16 weeks. Subsequently, BA.5 began to replace BA.2 as the dominant subvariant, sustaining a proportion greater than 50% for an even longer duration of 20 weeks. By the end of the year, BQ.1 surpassed BA.5, while XBB also emerged.</p><p>Negative discussions about fever rose to nearly 40% at the beginning of the year and subsequently exhibited 2 distinct peaks during the periods when BA.2 and BA.5 were absolutely dominant, respectively. The prompt public response to the symptom of fever during the early stages of subvariant evolution may be attributed to its role as the first symptom to manifest after infection with COVID-19 [<xref ref-type="bibr" rid="ref32">32</xref>].</p><p>One characteristic of the Omicron subvariants is that the majority of symptoms closely resemble those of the cold, including headaches and sore throat [<xref ref-type="bibr" rid="ref33">33</xref>]. This is illustrated in <xref ref-type="fig" rid="figure3">Figure 3</xref>, where these 2 symptoms exhibit the highest levels of negative sentiment.</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Specific symptom sentiment analysis with proportions of Omicron subvariants. The weekly negative rate is the calculated number of negative tweets for each symptom as a proportion of all tweets for the specific symptom. The evolution of the proportions of Omicron subvariants was determined based on the data on Omicron subvariant proportions from World Health Organization weekly reports.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v9i1e66237_fig03.png"/></fig></sec><sec id="s3-3"><title>Joinpoint Regression of the Number of Negative Tweets of COVID-19 Symptoms From 2022</title><p>Cough exhibited a transient rise in negative sentiment during only the initial stages of BA.2, while negative attitudes in this regard remained consistently low and stable during other periods (<xref ref-type="fig" rid="figure4">Figure 4</xref>). Given its persistent presence as a symptom of COVID-19 throughout the pandemic, the public might have developed a relatively comprehensive understanding of both the symptom itself and its associated management strategies. This symptom typically manifests in the middle stages of the infection [<xref ref-type="bibr" rid="ref32">32</xref>], and its prevalence had already begun to decline with the Omicron variant [<xref ref-type="bibr" rid="ref33">33</xref>].</p><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>Joinpoint regression analysis of weekly negative tweets: alignment with subvariant transition periods. Significant joinpoints, which indicate a significant change in the trend of negative tweet counts, are highlighted with the specific week in black squares. The background&#x2019;s shaded regions represent the transition periods of major SARS-CoV-2 Omicron subvariants throughout 2022.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v9i1e66237_fig04.png"/></fig><p>The joinpoint analysis revealed similar trends for diarrhea, headache, and throat-related discussions (<xref ref-type="fig" rid="figure4">Figure 4</xref>). These discussions declined as the proportion of BA.1 decreased and stabilized before BA.2 became dominant. However, only headache and throat-related negative discussions exhibited minimal fluctuations during the later phase of BA.2-BA.5.</p><p>Fever was able to capture more of the subvariants&#x2019; evolution, with negative tweets exhibiting a peak in sentiment during the later stages of each subvariant transition (<xref ref-type="fig" rid="figure4">Figure 4</xref>). Model estimates of the joinpoint regression can be seen in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p></sec><sec id="s3-4"><title>An Interactive Map of Opinion Analysis and Sentiment Visualization of COVID-19 Tweets</title><p>Social media platforms have become an essential channel for people to express their views and emotions about the epidemic. We developed an interactive map demo using the United States as an example to collect Twitter data, perform sentiment analysis through NLP, and link the results to corresponding geographic locations (<xref ref-type="fig" rid="figure5">Figure 5A</xref>). Of all the data we collected, tweets containing geographic information accounted for 1.5% (1351/391,508), while negative sentiment users accounted for 0.35% (5873/391,508) of all related tweets. This demo link is available at Tableau Public [<xref ref-type="bibr" rid="ref34">34</xref>]. This system provides a visual representation that provides an intuitive understanding of attitudes and emotions toward COVID-19 across different regions in the United States. Users can click on a specific location on the map to obtain detailed information about emotions from comments about COVID-19 (<xref ref-type="fig" rid="figure5">Figure 5B</xref>).</p><fig position="float" id="figure5"><label>Figure 5.</label><caption><p>(A) An interactive map of opinion analysis and sentiment visualization of COVID-19 tweets showing a sample of users with negative tweets. (B) Users can click on a specific location on the map to obtain detailed information about emotions from comments about COVID-19.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v9i1e66237_fig05.png"/></fig><p>The interactive map could deepen the understanding of people&#x2019;s opinions and emotions and provide valuable national information for decision-making, opinion management, and social intervention. In decision-making and public opinion management, analyzing the distribution of different opinions and emotional tendencies in the United States could help decision-makers better understand attitudes and opinions about COVID-19 in different places. This could help to formulate more effective policies to meet the needs of the public and improve the acceptance of policies. In terms of social intervention, interactive maps of the United States could help the government better understand the distribution of views. As a result, state governments could implement more targeted interventions, such as providing psychological support, disseminating information, and mobilizing communities to address mental health and social issues related to COVID-19.</p></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>Our findings corroborate clinical observations that Omicron subvariants shifted symptom profiles toward cold-like manifestations (eg, sore throat and headache), consistent with reports by Menni et al [<xref ref-type="bibr" rid="ref21">21</xref>] and Schulze et al [<xref ref-type="bibr" rid="ref22">22</xref>]. The heightened negative sentiment around headache and sore throat (<xref ref-type="fig" rid="figure3">Figure 3</xref>) likely reflects their unexpected prevalence during Omicron, contrasting with earlier variants. Notably, fever-related negativity proved uniquely sensitive to subvariant evolution, exhibiting dual peaks during BA.2 and BA.5 dominance. This suggests public social media reactivity may serve as a leading indicator for viral evolution&#x2014;a novel extension of prior infodemiology studies [eg, <xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref17">17</xref>]. However, the sustained high negative sentiment toward symptoms such as headache (<xref ref-type="fig" rid="figure3">Figure 3</xref>) requires nuanced interpretation. While headache prevalence increased during Omicron acute infection [<xref ref-type="bibr" rid="ref21">21</xref>], its persistent discussion throughout 2022 may also reflect growing public awareness of Long COVID, where headache is a predominant symptom affecting most cases [<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref36">36</xref>]. This &#x201C;twin-demic&#x201D; context, where acute infection waves coexist with Long COVID burden, introduces complexity in attributing symptom trends solely to variant dynamics.</p><p>The real-time geographic dashboard (<xref ref-type="fig" rid="figure5">Figure 5</xref>) operationalizes a key advantage of social media surveillance: overcoming delays in conventional reporting. For instance, our system detected the December 2022 case surge 1&#x2010;2 weeks before WHO confirmation [<xref ref-type="bibr" rid="ref19">19</xref>], enabling proactive resource targeting. This addresses critical gaps identified in traditional systems, such as lags in resource allocation during BA.5&#x2019;s rapid spread [<xref ref-type="bibr" rid="ref31">31</xref>]. Furthermore, sentiment-driven resource allocation (eg, directing mental health support to regions with rising negative tweets) offers a scalable complement to clinical surveys. Our method also expands on Mackey et al&#x2019;s [<xref ref-type="bibr" rid="ref14">14</xref>] symptom detection framework by integrating sentiment as a proxy for symptom severity and subvariant impact, though future models should distinguish acute versus chronic symptom manifestations through keyword filtering (eg, &#x201C;long-hauler&#x201D; and &#x201C;post-COVID&#x201D;) or duration-based classification.</p><p>Our study has 4 key limitations. First, the exclusive reliance on 2022 English-language tweets introduces demographic and linguistic biases, as Twitter users skew toward younger, urban, technologically adept populations. This limits generalizability to non-English speakers, older adults, and rural communities. Future work must integrate multilingual platforms (eg, Weibo and Facebook) and extend temporal coverage to strengthen model robustness. Second, clinical generalizability is constrained by the underrepresentation of pediatric populations. While children exhibit distinct Omicron symptom severity [<xref ref-type="bibr" rid="ref10">10</xref>], our adult-dominated dataset cannot capture this nuance. Subpopulation-specific analyses require complementary clinical data.</p><p>Third, geographic sparsity remains a challenge: only 1.5% (1351/391,508) of tweets contained usable location data, and inferred geodata may introduce biases. Resource allocation based solely on these sparse signals risks misprioritization. Cross-validation with electronic health records and refined geolocation inference algorithms is essential. Fourth, global representativity is compromised by overlapping biases in Twitter data (overrepresenting Anglophone nations) and WHO variant surveillance (skewed toward high-income countries). The observed correlations between sentiment and subvariants may reflect region-specific epidemiological patterns rather than global dynamics. Future research must prioritize intentional sampling from underrepresented regions and multiplatform data fusion to validate cross-cultural applicability. In addition, our analysis did not explicitly account for Long COVID&#x2013;related symptom reporting. Given that 2022 marked a peak in Long COVID cases (WHO COVID-19 Weekly Epidemiological Update, July 2022), symptom discussions, particularly for neurological manifestations like headache, likely conflated acute infection and chronic sequelae. This conflation may partially explain the sustained high negative sentiment for certain symptoms beyond variant transition periods (eg, headache negativity remained &#x003E;30% during BA.5 decline in <xref ref-type="fig" rid="figure3">Figure 3</xref>).</p><p>Beyond COVID-19, this study establishes a scalable framework for infodemiology-driven pandemic response. The integration of real-time social media analytics with conventional surveillance creates a synergistic system capable of (1) accelerating outbreak detection (eg, leveraging symptom sentiment as an early-warning signal), (2) optimizing precision public health interventions (eg, dynamic resource allocation based on geotagged emotional hotspots), and (3) enabling rapid evaluation of policy impacts (eg, monitoring sentiment shifts postvaccine rollout). As novel pathogens emerge, such systems could mitigate the &#x201C;infodemic&#x201D; paradox, where data abundance coexists with decision-making delays, by converting public discourse into actionable intelligence. Future iterations will expand linguistic parameters, incorporate clinical correlates, and develop predictive algorithms to establish a global public health intelligence platform, ultimately bridging the gap between digital epidemiology and frontline response. The framework&#x2019;s adaptability is particularly valuable for diseases with long-term sequelae (eg, Long COVID), where real-time tracking of chronic symptoms through social discourse could accelerate therapeutic development and patient support.</p></sec><sec id="s4-2"><title>Conclusions</title><p>In summary, our method allows rapid surveillance of changes in the geographical COVID-19 symptoms. This was accomplished using sentiment analysis of tweets from people who have been infected with COVID-19 to detect the geographical severity rate. At the individual level, it can detect the real-time severity of COVID-19 and could make it possible to provide medical and mental assistance. It also provides a new solution for coping with the urgent emergence of a new pandemic.</p></sec></sec></body><back><ack><p>The authors thank the individuals who participated in data collection and validation in this paper. We used artificial intelligence tools only for language polishing and grammar checking.</p></ack><notes><sec><title>Data Availability</title><p>The datasets and code generated or analyzed during the study are available from the corresponding author (WM) on reasonable request. The data will be shared for noncommercial purposes after being fully anonymized.</p></sec></notes><fn-group><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">CDC</term><def><p>Centers for Disease Control and Prevention</p></def></def-item><def-item><term id="abb2">NLP</term><def><p>natural language processing</p></def></def-item><def-item><term id="abb3">WHO</term><def><p>World Health Organization</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chan</surname><given-names>EH</given-names> </name><name name-style="western"><surname>Brewer</surname><given-names>TF</given-names> </name><name name-style="western"><surname>Madoff</surname><given-names>LC</given-names> </name><etal/></person-group><article-title>Global capacity for emerging infectious disease detection</article-title><source>Proc Natl Acad Sci USA</source><year>2010</year><month>12</month><day>14</day><volume>107</volume><issue>50</issue><fpage>21701</fpage><lpage>21706</lpage><pub-id pub-id-type="doi">10.1073/pnas.1006219107</pub-id><pub-id pub-id-type="medline">21115835</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Velasco</surname><given-names>E</given-names> </name><name name-style="western"><surname>Agheneza</surname><given-names>T</given-names> </name><name name-style="western"><surname>Denecke</surname><given-names>K</given-names> </name><name name-style="western"><surname>Kirchner</surname><given-names>G</given-names> </name><name name-style="western"><surname>Eckmanns</surname><given-names>T</given-names> </name></person-group><article-title>Social media and internet-based data in global systems for public health surveillance: a systematic review</article-title><source>Milbank Q</source><year>2014</year><month>03</month><volume>92</volume><issue>1</issue><fpage>7</fpage><lpage>33</lpage><pub-id pub-id-type="doi">10.1111/1468-0009.12038</pub-id><pub-id pub-id-type="medline">24597553</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="web"><article-title>Strengthening surveillance of and response to foodborne diseases: a practical manual. Stage 2: strengthening indicator-based surveillance</article-title><source>World Health Organization</source><year>2017</year><access-date>2025-08-30</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.who.int/publications/i/item/9789241513258">https://www.who.int/publications/i/item/9789241513258</ext-link></comment></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Brownstein</surname><given-names>JS</given-names> </name><name name-style="western"><surname>Freifeld</surname><given-names>CC</given-names> </name><name name-style="western"><surname>Chan</surname><given-names>EH</given-names> </name><etal/></person-group><article-title>Information technology and global surveillance of cases of 2009 H1N1 influenza</article-title><source>N Engl J Med</source><year>2010</year><month>05</month><day>6</day><volume>362</volume><issue>18</issue><fpage>1731</fpage><lpage>1735</lpage><pub-id pub-id-type="doi">10.1056/NEJMsr1002707</pub-id><pub-id pub-id-type="medline">20445186</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chunara</surname><given-names>R</given-names> </name><name name-style="western"><surname>Andrews</surname><given-names>JR</given-names> </name><name name-style="western"><surname>Brownstein</surname><given-names>JS</given-names> </name></person-group><article-title>Social and news media enable estimation of epidemiological patterns early in the 2010 Haitian cholera outbreak</article-title><source>Am J Trop Med Hyg</source><year>2012</year><month>01</month><volume>86</volume><issue>1</issue><fpage>39</fpage><lpage>45</lpage><pub-id pub-id-type="doi">10.4269/ajtmh.2012.11-0597</pub-id><pub-id pub-id-type="medline">22232449</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Gomide</surname><given-names>J</given-names> </name><name name-style="western"><surname>Veloso</surname><given-names>A</given-names> </name><name name-style="western"><surname>Meira</surname><given-names>W</given-names> </name><etal/></person-group><article-title>Dengue surveillance based on a computational model of spatio-temporal locality of Twitter</article-title><access-date>2025-07-23</access-date><conf-name>WebSci &#x2019;11</conf-name><conf-date>Jun 15-17, 2011</conf-date><conf-loc>Koblenz, Germany</conf-loc><comment><ext-link ext-link-type="uri" xlink:href="https://dl.acm.org/doi/proceedings/10.1145/2527031">https://dl.acm.org/doi/proceedings/10.1145/2527031</ext-link></comment><pub-id pub-id-type="doi">10.1145/2527031.2527049</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nsoesie</surname><given-names>EO</given-names> </name><name name-style="western"><surname>Flor</surname><given-names>L</given-names> </name><name name-style="western"><surname>Hawkins</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Social media as a sentinel for disease surveillance: what does sociodemographic status have to do with it?</article-title><source>PLoS Curr</source><year>2016</year><month>12</month><day>7</day><volume>8</volume><fpage>ecurrents.outbreaks.cc09a42586e16dc7dd62813b7ee5d6b6</fpage><pub-id pub-id-type="doi">10.1371/currents.outbreaks.cc09a42586e16dc7dd62813b7ee5d6b6</pub-id><pub-id pub-id-type="medline">28123858</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Odlum</surname><given-names>M</given-names> </name><name name-style="western"><surname>Yoon</surname><given-names>S</given-names> </name></person-group><article-title>What can we learn about the Ebola outbreak from tweets?</article-title><source>Am J Infect Control</source><year>2015</year><month>06</month><volume>43</volume><issue>6</issue><fpage>563</fpage><lpage>571</lpage><pub-id pub-id-type="doi">10.1016/j.ajic.2015.02.023</pub-id><pub-id pub-id-type="medline">26042846</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shin</surname><given-names>SY</given-names> </name><name name-style="western"><surname>Seo</surname><given-names>DW</given-names> </name><name name-style="western"><surname>An</surname><given-names>J</given-names> </name><etal/></person-group><article-title>High correlation of Middle East respiratory syndrome spread with Google search and Twitter trends in Korea</article-title><source>Sci Rep</source><year>2016</year><month>09</month><day>6</day><volume>6</volume><issue>1</issue><fpage>32920</fpage><pub-id pub-id-type="doi">10.1038/srep32920</pub-id><pub-id pub-id-type="medline">27595921</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>McGough</surname><given-names>SF</given-names> </name><name name-style="western"><surname>Brownstein</surname><given-names>JS</given-names> </name><name name-style="western"><surname>Hawkins</surname><given-names>JB</given-names> </name><name name-style="western"><surname>Santillana</surname><given-names>M</given-names> </name></person-group><article-title>Forecasting Zika incidence in the 2016 Latin America outbreak combining traditional disease surveillance with search, social media, and news report data</article-title><source>PLoS Negl Trop Dis</source><year>2017</year><month>01</month><volume>11</volume><issue>1</issue><fpage>e0005295</fpage><pub-id pub-id-type="doi">10.1371/journal.pntd.0005295</pub-id><pub-id pub-id-type="medline">28085877</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jeon</surname><given-names>J</given-names> </name><name name-style="western"><surname>Baruah</surname><given-names>G</given-names> </name><name name-style="western"><surname>Sarabadani</surname><given-names>S</given-names> </name><name name-style="western"><surname>Palanica</surname><given-names>A</given-names> </name></person-group><article-title>Identification of risk factors and symptoms of COVID-19: analysis of biomedical literature and social media data</article-title><source>J Med Internet Res</source><year>2020</year><month>10</month><day>2</day><volume>22</volume><issue>10</issue><fpage>e20509</fpage><pub-id pub-id-type="doi">10.2196/20509</pub-id><pub-id pub-id-type="medline">32936770</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Oyebode</surname><given-names>O</given-names> </name><name name-style="western"><surname>Ndulue</surname><given-names>C</given-names> </name><name name-style="western"><surname>Adib</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Health, psychosocial, and social issues emanating from the COVID-19 pandemic based on social media comments: text mining and thematic analysis approach</article-title><source>JMIR Med Inform</source><year>2021</year><month>04</month><day>6</day><volume>9</volume><issue>4</issue><fpage>e22734</fpage><pub-id pub-id-type="doi">10.2196/22734</pub-id><pub-id pub-id-type="medline">33684052</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Medford</surname><given-names>RJ</given-names> </name><name name-style="western"><surname>Saleh</surname><given-names>SN</given-names> </name><name name-style="western"><surname>Sumarsono</surname><given-names>A</given-names> </name><name name-style="western"><surname>Perl</surname><given-names>TM</given-names> </name><name name-style="western"><surname>Lehmann</surname><given-names>CU</given-names> </name></person-group><article-title>An &#x201C;infodemic&#x201D;: leveraging high-volume Twitter data to understand early public sentiment for the coronavirus disease 2019 outbreak</article-title><source>Open Forum Infect Dis</source><year>2020</year><month>07</month><volume>7</volume><issue>7</issue><fpage>ofaa258</fpage><pub-id pub-id-type="doi">10.1093/ofid/ofaa258</pub-id><pub-id pub-id-type="medline">33117854</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mackey</surname><given-names>T</given-names> </name><name name-style="western"><surname>Purushothaman</surname><given-names>V</given-names> </name><name name-style="western"><surname>Li</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Machine learning to detect self-reporting of symptoms, testing access, and recovery associated with COVID-19 on Twitter: retrospective big data infoveillance study</article-title><source>JMIR Public Health Surveill</source><year>2020</year><month>06</month><day>8</day><volume>6</volume><issue>2</issue><fpage>e19509</fpage><pub-id pub-id-type="doi">10.2196/19509</pub-id><pub-id pub-id-type="medline">32490846</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nemes</surname><given-names>L</given-names> </name><name name-style="western"><surname>Kiss</surname><given-names>A</given-names> </name></person-group><article-title>Social media sentiment analysis based on COVID-19</article-title><source>J Inform Telecommun</source><year>2021</year><month>01</month><day>2</day><volume>5</volume><issue>1</issue><fpage>1</fpage><lpage>15</lpage><pub-id pub-id-type="doi">10.1080/24751839.2020.1790793</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wu</surname><given-names>J</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>L</given-names> </name><name name-style="western"><surname>Hua</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>Trend and co-occurrence network of COVID-19 symptoms from large-scale social media data: infoveillance study</article-title><source>J Med Internet Res</source><year>2023</year><month>03</month><day>14</day><volume>25</volume><fpage>e45419</fpage><pub-id pub-id-type="doi">10.2196/45419</pub-id><pub-id pub-id-type="medline">36812402</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Thakur</surname><given-names>N</given-names> </name><name name-style="western"><surname>Han</surname><given-names>CY</given-names> </name></person-group><article-title>An exploratory study of tweets about the SARS-CoV-2 Omicron Variant: insights from sentiment analysis, language interpretation, source tracking, type classification, and embedded URL detection</article-title><source>COVID</source><year>2022</year><volume>2</volume><issue>8</issue><fpage>1026</fpage><lpage>1049</lpage><pub-id pub-id-type="doi">10.3390/covid2080076</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Crawley</surname><given-names>AW</given-names> </name><name name-style="western"><surname>Divi</surname><given-names>N</given-names> </name><name name-style="western"><surname>Smolinski</surname><given-names>MS</given-names> </name></person-group><article-title>Using timeliness metrics to track progress and identify gaps in disease surveillance</article-title><source>Health Secur</source><year>2021</year><volume>19</volume><issue>3</issue><fpage>309</fpage><lpage>317</lpage><pub-id pub-id-type="doi">10.1089/hs.2020.0139</pub-id><pub-id pub-id-type="medline">33891487</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="web"><article-title>Symptoms of COVID-19</article-title><source>Centers for Disease Control and Prevention</source><year>2022</year><month>10</month><day>26</day><access-date>2025-07-23</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.cdc.gov/coronavirus/2019-ncov/symptoms-testing/symptoms.html">https://www.cdc.gov/coronavirus/2019-ncov/symptoms-testing/symptoms.html</ext-link></comment></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="web"><article-title>RoBERTa base model</article-title><source>Hugging Face</source><access-date>2025-07-23</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://huggingface.co/FacebookAI/roberta-base">https://huggingface.co/FacebookAI/roberta-base</ext-link></comment></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Menni</surname><given-names>C</given-names> </name><name name-style="western"><surname>Valdes</surname><given-names>AM</given-names> </name><name name-style="western"><surname>Polidori</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Symptom prevalence, duration, and risk of hospital admission in individuals infected with SARS-CoV-2 during periods of omicron and delta variant dominance: a prospective observational study from the ZOE COVID study</article-title><source>Lancet</source><year>2022</year><month>04</month><day>23</day><volume>399</volume><issue>10335</issue><fpage>1618</fpage><lpage>1624</lpage><pub-id pub-id-type="doi">10.1016/S0140-6736(22)00327-0</pub-id><pub-id pub-id-type="medline">35397851</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Schulze</surname><given-names>H</given-names> </name><name name-style="western"><surname>Bayer</surname><given-names>W</given-names> </name></person-group><article-title>Changes in symptoms experienced by SARS-CoV-2-infected individuals &#x2013; from the first wave to the Omicron Variant</article-title><source>Front Virol</source><year>2022</year><volume>2</volume><pub-id pub-id-type="doi">10.3389/fviro.2022.880707</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Iacobucci</surname><given-names>G</given-names> </name></person-group><article-title>Covid-19: UK adds sore throat, headache, fatigue, and six other symptoms to official list</article-title><source>BMJ</source><year>2022</year><month>04</month><day>4</day><volume>377</volume><fpage>o892</fpage><pub-id pub-id-type="doi">10.1136/bmj.o892</pub-id><pub-id pub-id-type="medline">35379691</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="report"><article-title>Weekly epidemiological update on COVID-19</article-title><year>2022</year><month>06</month><day>22</day><access-date>2025-07-23</access-date><publisher-name>World Health Organization</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://www.who.int/emergencies/diseases/novel-coronavirus-2019/situation-reports">https://www.who.int/emergencies/diseases/novel-coronavirus-2019/situation-reports</ext-link></comment></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tuekprakhon</surname><given-names>A</given-names> </name><name name-style="western"><surname>Nutalai</surname><given-names>R</given-names> </name><name name-style="western"><surname>Dijokaite-Guraliuc</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Antibody escape of SARS-CoV-2 Omicron BA.4 and BA.5 from vaccine and BA.1 serum</article-title><source>Cell</source><year>2022</year><month>07</month><day>7</day><volume>185</volume><issue>14</issue><fpage>2422</fpage><lpage>2433</lpage><pub-id pub-id-type="doi">10.1016/j.cell.2022.06.005</pub-id><pub-id pub-id-type="medline">35772405</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hachmann</surname><given-names>NP</given-names> </name><name name-style="western"><surname>Miller</surname><given-names>J</given-names> </name><name name-style="western"><surname>Collier</surname><given-names>ARY</given-names> </name><etal/></person-group><article-title>Neutralization escape by SARS-CoV-2 Omicron subvariants BA.2.12.1, BA.4, and BA.5</article-title><source>N Engl J Med</source><year>2022</year><month>07</month><day>7</day><volume>387</volume><issue>1</issue><fpage>86</fpage><lpage>88</lpage><pub-id pub-id-type="doi">10.1056/NEJMc2206576</pub-id><pub-id pub-id-type="medline">35731894</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shrestha</surname><given-names>LB</given-names> </name><name name-style="western"><surname>Foster</surname><given-names>C</given-names> </name><name name-style="western"><surname>Rawlinson</surname><given-names>W</given-names> </name><name name-style="western"><surname>Tedla</surname><given-names>N</given-names> </name><name name-style="western"><surname>Bull</surname><given-names>RA</given-names> </name></person-group><article-title>Evolution of the SARS-CoV-2 omicron variants BA.1 to BA.5: implications for immune escape and transmission</article-title><source>Rev Med Virol</source><year>2022</year><month>09</month><volume>32</volume><issue>5</issue><fpage>e2381</fpage><pub-id pub-id-type="doi">10.1002/rmv.2381</pub-id><pub-id pub-id-type="medline">35856385</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kang</surname><given-names>SW</given-names> </name><name name-style="western"><surname>Park</surname><given-names>H</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>JY</given-names> </name><etal/></person-group><article-title>Comparison of the clinical and virological characteristics of SARS-CoV-2 Omicron BA.1/BA.2 and omicron BA.5 variants: a prospective cohort study</article-title><source>J Infect</source><year>2023</year><month>05</month><volume>86</volume><issue>5</issue><fpage>e148</fpage><lpage>e151</lpage><pub-id pub-id-type="doi">10.1016/j.jinf.2023.01.015</pub-id><pub-id pub-id-type="medline">36669564</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Goller</surname><given-names>KV</given-names> </name><name name-style="western"><surname>Moritz</surname><given-names>J</given-names> </name><name name-style="western"><surname>Ziemann</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Differences in clinical presentations of Omicron infections with the Lineages BA.2 and BA.5 in Mecklenburg-Western Pomerania, Germany, between April and July 2022</article-title><source>Viruses</source><year>2022</year><month>09</month><day>13</day><volume>14</volume><issue>9</issue><fpage>2033</fpage><pub-id pub-id-type="doi">10.3390/v14092033</pub-id><pub-id pub-id-type="medline">36146837</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tamura</surname><given-names>T</given-names> </name><name name-style="western"><surname>Ito</surname><given-names>J</given-names> </name><name name-style="western"><surname>Uriu</surname><given-names>K</given-names> </name><etal/></person-group><article-title>Virological characteristics of the SARS-CoV-2 XBB variant derived from recombination of two Omicron subvariants</article-title><source>Nat Commun</source><year>2023</year><month>05</month><day>16</day><volume>14</volume><issue>1</issue><fpage>2800</fpage><pub-id pub-id-type="doi">10.1038/s41467-023-38435-3</pub-id><pub-id pub-id-type="medline">37193706</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kimura</surname><given-names>I</given-names> </name><name name-style="western"><surname>Yamasoba</surname><given-names>D</given-names> </name><name name-style="western"><surname>Tamura</surname><given-names>T</given-names> </name><etal/></person-group><article-title>Virological characteristics of the SARS-CoV-2 Omicron BA.2 subvariants, including BA.4 and BA.5</article-title><source>Cell</source><year>2022</year><month>10</month><day>13</day><volume>185</volume><issue>21</issue><fpage>3992</fpage><lpage>4007</lpage><pub-id pub-id-type="doi">10.1016/j.cell.2022.09.018</pub-id><pub-id pub-id-type="medline">36198317</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Larsen</surname><given-names>JR</given-names> </name><name name-style="western"><surname>Martin</surname><given-names>MR</given-names> </name><name name-style="western"><surname>Martin</surname><given-names>JD</given-names> </name><name name-style="western"><surname>Kuhn</surname><given-names>P</given-names> </name><name name-style="western"><surname>Hicks</surname><given-names>JB</given-names> </name></person-group><article-title>Modeling the onset of symptoms of COVID-19</article-title><source>Front Public Health</source><year>2020</year><volume>8</volume><fpage>473</fpage><pub-id pub-id-type="doi">10.3389/fpubh.2020.00473</pub-id><pub-id pub-id-type="medline">32903584</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="web"><article-title>Londoners with cold symptoms more likely to have Covid, says expert</article-title><source>The Guardian</source><year>2021</year><access-date>2025-08-30</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.theguardian.com/world/2021/dec/15/londoners-with-cold-symptoms-more-likely-to-have-covid-expert-omicron">https://www.theguardian.com/world/2021/dec/15/londoners-with-cold-symptoms-more-likely-to-have-covid-expert-omicron</ext-link></comment></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="web"><article-title>Location&#x0026;description</article-title><source>Tableau Public</source><access-date>2025-09-02</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://public.tableau.com/app/profile/sia7698/viz/Locationdescription/Sheet8">https://public.tableau.com/app/profile/sia7698/viz/Locationdescription/Sheet8</ext-link></comment></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tana</surname><given-names>C</given-names> </name><name name-style="western"><surname>Bentivegna</surname><given-names>E</given-names> </name><name name-style="western"><surname>Cho</surname><given-names>SJ</given-names> </name><etal/></person-group><article-title>Long COVID headache</article-title><source>J Headache Pain</source><year>2022</year><month>08</month><day>1</day><volume>23</volume><issue>1</issue><fpage>93</fpage><pub-id pub-id-type="doi">10.1186/s10194-022-01450-8</pub-id><pub-id pub-id-type="medline">35915417</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>G&#x00F3;mez-Dab&#x00F3;</surname><given-names>L</given-names> </name><name name-style="western"><surname>Melgarejo-Mart&#x00ED;nez</surname><given-names>L</given-names> </name><name name-style="western"><surname>Caronna</surname><given-names>E</given-names> </name><name name-style="western"><surname>Pozo-Rosich</surname><given-names>P</given-names> </name></person-group><article-title>Headache in COVID-19 and Long COVID: to know facts for clinical practice</article-title><source>Curr Neurol Neurosci Rep</source><year>2023</year><month>10</month><volume>23</volume><issue>10</issue><fpage>551</fpage><lpage>560</lpage><pub-id pub-id-type="doi">10.1007/s11910-023-01296-w</pub-id><pub-id pub-id-type="medline">37665495</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Model estimates of joinpoint regression.</p><media xlink:href="formative_v9i1e66237_app1.pdf" xlink:title="PDF File, 130 KB"/></supplementary-material></app-group></back></article>