<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.0" xmlns:xlink="http://www.w3.org/1999/xlink">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JFR</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Form Res</journal-id>
      <journal-title>JMIR Formative Research</journal-title>
      <issn pub-type="epub">2561-326X</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v9i1e55309</article-id>
      <article-id pub-id-type="pmid">39879094</article-id>
      <article-id pub-id-type="doi">10.2196/55309</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Understanding Health-Related Discussions on Reddit: Development of a Topic Assignment Method and Exploratory Analysis</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Mavragani</surname>
            <given-names>Amaryllis</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Mistry</surname>
            <given-names>Jinal</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Chan</surname>
            <given-names>Garrett J</given-names>
          </name>
          <degrees>MD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-3660-5135</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Fung</surname>
            <given-names>Mark</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6081-4151</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Warrington</surname>
            <given-names>Jill</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2196-1789</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Nowak</surname>
            <given-names>Sarah A</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <address>
            <institution>Larner College of Medicine</institution>
            <institution>University of Vermont</institution>
            <addr-line>89 Beaumont Ave</addr-line>
            <addr-line>Burlington, VT, 05405</addr-line>
            <country>United States</country>
            <phone>1 802 656 0359</phone>
            <email>sarah.nowak@med.uvm.edu</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5965-9035</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Departments of Pathology and Laboratory Medicine</institution>
        <institution>University of California, San Francisco</institution>
        <addr-line>San Francisco, CA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Larner College of Medicine</institution>
        <institution>University of Vermont</institution>
        <addr-line>Burlington, VT</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Sarah A Nowak <email>sarah.nowak@med.uvm.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2025</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>29</day>
        <month>1</month>
        <year>2025</year>
      </pub-date>
      <volume>9</volume>
      <elocation-id>e55309</elocation-id>
      <history>
        <date date-type="received">
          <day>8</day>
          <month>12</month>
          <year>2023</year>
        </date>
        <date date-type="rev-request">
          <day>26</day>
          <month>8</month>
          <year>2024</year>
        </date>
        <date date-type="rev-recd">
          <day>10</day>
          <month>10</month>
          <year>2024</year>
        </date>
        <date date-type="accepted">
          <day>28</day>
          <month>10</month>
          <year>2024</year>
        </date>
      </history>
      <copyright-statement>©Garrett J Chan, Mark Fung, Jill Warrington, Sarah A Nowak. Originally published in JMIR Formative Research (https://formative.jmir.org), 29.01.2025.</copyright-statement>
      <copyright-year>2025</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Formative Research, is properly cited. The complete bibliographic information, a link to the original publication on https://formative.jmir.org, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://formative.jmir.org/2025/1/e55309" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Social media has become a widely used way for people to share opinions about health care and medical topics. Social media data can be leveraged to understand patient concerns and provide insight into why patients may turn to the internet instead of the health care system for health advice.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aimed to develop a method to investigate Reddit posts discussing health-related conditions. Our goal was to characterize these topics and identify trends in these social media–based medical discussions.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>Using an initial query, we collected 1 year of Reddit posts containing the phrases “get tested” and “get checked.” These posts were manually reviewed, and subreddits containing irrelevant posts were excluded from analysis. This selection of posts was manually read by the investigators to categorize posts into topics. A script was developed to automatically assign topics to additional posts based on keywords. Topic and keyword selections were refined based on manual review for more accurate topic assignment. Topic assignment was then performed on the entire 1-year Reddit dataset containing 347,130 posts. Related topics were grouped into broader medical disciplines. Analysis of the topic assignments was then conducted to assess condition and medical topic frequencies in medical condition–focused subreddits and general subreddits.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>We created an automated algorithm to assign medical topics to Reddit posts. By iterating through multiple rounds of topic assignment, we improved the accuracy of the algorithm. Ultimately, this algorithm created 82 topics sorted into 17 broader medical disciplines. Of all topics, sexually transmitted infections (STIs), eye disorders, anxiety, and pregnancy had the highest post frequency overall. STIs comprised 7.44% (5876/78,980) of posts, and anxiety comprised 5.43% (4289/78,980) of posts. A total of 34% (28/82) of the topics comprised 80% (63,184/78,980) of all posts. Of the medical disciplines, those with the most posts were psychiatry and mental health; genitourinary and reproductive health; infectious diseases; and endocrinology, nutrition, and metabolism. Psychiatry and mental health comprised 26.6% (21,009/78,980) of posts, and genitourinary and reproductive health comprised 13.6% (10,741/78,980) of posts. Overall, most posts were also classified under these 4 medical disciplines. During analysis, subreddits were also classified as <italic>general</italic> if they did not focus on a specific health issue and <italic>topic-specific</italic> if they discussed a specific medical issue. Topics that appeared most frequently in the top 5 in general subreddits included addiction and drug anxiety, attention-deficit/hyperactivity disorder, abuse, and STIs. In topic-specific subreddits, most posts were found to discuss the topic of that subreddit.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Certain health topics and medical disciplines are predominant on Reddit. These include topics such as STIs, eye disorders, anxiety, and pregnancy. Most posts were classified under the medical disciplines of psychiatry and mental health, as well as genitourinary and reproductive health.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>digital health</kwd>
        <kwd>internet</kwd>
        <kwd>open data</kwd>
        <kwd>social networking</kwd>
        <kwd>social media</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>With over 3.8 billion people regularly sharing information about their lives on social media platforms [<xref ref-type="bibr" rid="ref1">1</xref>], social media has become a ubiquitous part of daily life. In addition to building relationships with other people, social media helps users find information on disciplines that they are concerned about or interested in. Social media platforms have become a commonly used way to discuss problems and seek advice [<xref ref-type="bibr" rid="ref2">2</xref>-<xref ref-type="bibr" rid="ref4">4</xref>].</p>
        <p>Given its prevalent use, social media content may provide insight into individual attitudes and opinions about health. The anonymous nature of certain social media platforms allows users to choose to discuss potentially embarrassing subjects without an expectation of privacy. Deidentified information can be used for research purposes to understand social behavior as it is impossible to associate a specific comment with a single person.</p>
        <p>Analysis of social media content has other strengths compared to more traditional methods such as surveys. For example, surveys may be influenced by social desirability bias, and respondents may not be as open when discussing sensitive or potentially embarrassing conditions [<xref ref-type="bibr" rid="ref5">5</xref>] such as drug use or sexually transmitted infections (STIs). Several studies have demonstrated that internet-based platforms can circumvent or mitigate this limitation. For example, as Google search history reflects an active process (seeking information) rather than stated beliefs, it may be more accurate than surveys for some stigmatized beliefs in particular [<xref ref-type="bibr" rid="ref6">6</xref>]. People have a variety of motivations for using social media, including information seeking, information sharing, and expression of opinion [<xref ref-type="bibr" rid="ref2">2</xref>]. While previous work has also shown that online content becomes more widely shared, or viral, when it evokes strong, activating emotions, either positive or negative [<xref ref-type="bibr" rid="ref7">7</xref>], some studies have suggested that individuals may be more honest when sharing their thoughts online.</p>
        <p>An advantage of the use of social media to learn about people’s behaviors and sentiments is that we can obtain large volumes of data in a short period and user-generated content can be processed quickly [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref9">9</xref>]. Social media websites count among the most trafficked ones in the United States. Facebook is the 6th most popular website in the United States at the time of writing, Reddit is the 7th, Instagram is the 18th, and Twitter (subsequently rebranded X) is the 33rd. The variety of topics discussed on social media is wide-ranging, and these topics include information about people’s health concerns as users can pose and answer questions about health-related conditions on internet forums.</p>
        <p>Reddit has over 270 million monthly users [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref11">11</xref>] who can post first-person accounts of illness and interactions with the health care system and leave comments on other users’ posts about their experiences with similar illnesses. At the time of writing, Reddit ranks 17th in global engagement [<xref ref-type="bibr" rid="ref12">12</xref>]. In addition, 42.8% of Reddit site traffic comes from search engines rather than direct visits to the site. For comparison, only 12.4% of Twitter traffic comes from searches, which may mean that a greater proportion of visits to Reddit comes from internet users doing a general search for information rather than choosing to go to a specific website. Therefore, many internet users reach Reddit from search engines, making the site an important source of information to both Reddit users and nonusers.</p>
        <p>While the spectrum of discussion about health on social media is broad, studies of sites such as Reddit, Twitter, and Facebook have been able to examine disease- and health concern–specific discussions. This includes detection of opioid addiction based on Twitter posts [<xref ref-type="bibr" rid="ref13">13</xref>] and discussion of colorectal cancer, breast cancer, and diabetes through analysis of Twitter posts and Facebook groups [<xref ref-type="bibr" rid="ref14">14</xref>]. One study also categorized user data from Twitter posts into 4 specific disease-related topics: <italic>flu</italic>, <italic>depression</italic>, <italic>pregnancy</italic>, and <italic>eating disorders</italic> [<xref ref-type="bibr" rid="ref15">15</xref>]. Other studies on Reddit have sought to detect depression [<xref ref-type="bibr" rid="ref16">16</xref>], detect suicidality among opioid users [<xref ref-type="bibr" rid="ref17">17</xref>], and characterize weight loss discussions [<xref ref-type="bibr" rid="ref18">18</xref>]. These works have demonstrated the ability to select specific topics from social media data and draw conclusions about how these topics are encountered in the social media sphere. Multiple studies have characterized language markers to evaluate discussions on medical topics, giving each medical topic a unique pattern of markers [<xref ref-type="bibr" rid="ref19">19</xref>]. In all, each medical topic can be thought of as having a social media “gene” that conceptualizes it as having a recognizable identity on social media that can be tracked and analyzed [<xref ref-type="bibr" rid="ref20">20</xref>].</p>
        <p>The specific system architecture and features of different social media platforms make each more optimally suited for different types of studies (<xref ref-type="table" rid="table1">Table 1</xref>). For example, differences in information organization, post length, and rules for content creation can influence the analysis. The use of Reddit, for example, is well suited for evaluation of stigmatized topics and topic-based conversations. On Reddit, posts are organized into groups by topic, and users can interact through specific forums, called subreddits, to find discussions related to the subject they are interested in. A post’s visibility in a subreddit is determined by user upvotes and downvotes. In addition, posts may be removed by moderators if they violate subreddit-specific community rules [<xref ref-type="bibr" rid="ref21">21</xref>]. Therefore, subreddits are a dedicated space for people to address a topic with the expectation of pertinent discussion. Previous work has noted that the topic-based organization of Reddit content is appropriate for studying specific health topics in greater detail [<xref ref-type="bibr" rid="ref22">22</xref>]. Furthermore, some subreddits are question and answer–based. On the subreddit <italic>r/askdocs</italic>, users can seek answers about medical topics from health professionals who have been verified by subreddit moderators. While these subreddits do not coalesce around a certain topic, they allow users to ask questions to content experts anonymously, a function difficult to find on other social media platforms.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Comparison of select social media platforms by content, organization, level of anonymity, moderation, and number of articles on PubMed.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="180"/>
            <col width="280"/>
            <col width="320"/>
            <col width="220"/>
            <thead>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Reddit</td>
                <td>Twitter</td>
                <td>Facebook</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Content length</td>
                <td>40,000-character limit</td>
                <td>280-character limit</td>
                <td>No limit</td>
              </tr>
              <tr valign="top">
                <td>Content organization and sharing</td>
                <td>Users search for posts of interest; posts organized in topic-based subreddits</td>
                <td>On the basis of accounts that a user follows; users can search for common themes using hashtags</td>
                <td>Often based on real-life connections</td>
              </tr>
              <tr valign="top">
                <td>Anonymity</td>
                <td>May be completely anonymous</td>
                <td>May or may not be anonymous</td>
                <td>Real-name culture encouraged</td>
              </tr>
              <tr valign="top">
                <td>Moderation</td>
                <td>User moderated; subreddits have content guidelines</td>
                <td>Platform moderated</td>
                <td>Platform moderated</td>
              </tr>
              <tr valign="top">
                <td>PubMed articles, N</td>
                <td>277</td>
                <td>5769</td>
                <td>5030</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <p>Despite discussion forums such as Reddit having features that distinguish them from platforms such as Twitter and Facebook in important ways, comparatively little research has been conducted investigating health beliefs and discussions on Reddit. A number of text analysis studies on social media platforms have been conducted—at the time of writing, there are 5769 articles on PubMed discussing Twitter and 5030 about Facebook. However, only 277 articles have been published discussing Reddit [<xref ref-type="bibr" rid="ref23">23</xref>]. For an internet user searching for information on a specific subject, Reddit represents a useful starting point because of its topic-focused organization.</p>
      </sec>
      <sec>
        <title>Objectives</title>
        <p>We report a text analysis of health concerns and topics reflected in users’ Reddit posts during 2019. Given the previous studies on using social media to study health and medicine, we wanted to continue this work while looking at medical topics on another platform. In addition to the relative lack of study compared to other social media platforms, we chose to investigate Reddit because it has features that differentiate it from heretofore more frequently studied social media platforms: specific, topic-based discussions; greater anonymity; and user moderators. We wanted to capture posts from a variety of health-relevant subreddits discussing seeking or receiving testing and diagnostic advice.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Ethical Considerations</title>
        <p>The RAND Corporation was consulted regarding institutional review board approval. The RAND Human Subject Protection Committee (the RAND Institutional Review Board) determined that the project did not involve human participants as defined by the regulations of Title 45 of the Code of Federal Regulations Part 46.102(f) and, therefore, was not subject to further review. We did not explicitly obtain a waiver of informed consent; however, the determination of the absence of human participants implies a waiver of the need for documented informed consent. In addition, all data were anonymous, and obtaining informed consent would require identifying individuals, which would also be a violation of the Reddit terms of service.</p>
      </sec>
      <sec>
        <title>Overview</title>
        <p>We conducted our analysis in 4 steps (<xref rid="figure1" ref-type="fig">Figure 1</xref>) designed to balance false positives and false negatives. In step 1, we developed and refined a query to obtain posts about medical testing and advice about seeking diagnoses. In step 2, topics were created to classify the posts. Subreddits that clearly contained irrelevant posts were identified and excluded to improve the efficiency of the topic creation process. In step 3, posts assigned to the developed topics were reviewed, and the keywords used for topic assignment were refined. The process for identifying subreddits with relevant posts to be included in the analysis was refined as well. In step 4, keywords were used to do a final automatic assignment to a set of posts from a 12-month period. The 4 steps are shown in more detail in <xref rid="figure2" ref-type="fig">Figure 2</xref> and are described in the following sections.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Overview of analysis steps—the overall methodology for gathering posts, creating topics, and automatically assigning posts to topics.</p>
          </caption>
          <graphic xlink:href="formative_v9i1e55309_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Step 1: Query Creation and Refinement</title>
        <p>First, we captured posts from Reddit that were relevant to testing and diagnosis. We developed a query in Crimson Hexagon’s Monitor application programming interface to obtain posts that contained variations of the phrases “getting tested” or “getting checked out” and excluded posts from subreddits that would be unlikely to be relevant to medicine or health care (<xref rid="figure2" ref-type="fig">Figure 2</xref>A and Table S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). The query run was as follows: “((get OR got) AND ((test AND tested)OR(check OR checked)) AND for)~4” (<xref rid="figure2" ref-type="fig">Figure 2</xref>A). Posts gathered using this query contained the word “get” or “got” in conjunction with “test,” “tested,” “check,” or “checked,” with these words appearing within 4 words of each other. The posts collected were created between January 1, 2019, and December 31, 2019, and included the text content of the post, its title, and its date. A <italic>post</italic> could be the body of text created by the original poster or a comment from a user on an original post. In both cases, the content of a post during our analysis included the title of the original post to provide additional context.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Detailed flow diagrams of analysis steps 1 to 4. (A) Step 1: selection of Reddit posts. Posts from January 1, 2019, to December 31, 2019, were considered in this study. (B) Step 2: identification of topic keywords. Topics were manually created from three 100-post samples, and keywords were assigned to each topic. (C) Step 3: topic assignment. Topics were manually assigned to additional 100-post samples based on the topic keyword file. (D) Step 4: automatic assignment of posts for analysis. The algorithm using the final topic keyword file was run on 78,980 posts chosen from the overall corpus of 347,130 posts.</p>
          </caption>
          <graphic xlink:href="formative_v9i1e55309_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>To limit our false-positive rate, we first excluded subreddits tabulated on <italic>r/listofsubreddits</italic> (accessed November 18, 2019) that would be most irrelevant to health-related discussions (Table S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Posts not from these subreddits were included in the topic creation step.</p>
      </sec>
      <sec>
        <title>Step 2: Topic Creation</title>
        <p>In this step, we manually read through 100 posts and labeled each with a de novo topic (<xref rid="figure2" ref-type="fig">Figure 2</xref>B). Topic creation was guided by the existing taxonomy in the <italic>International Classification of Diseases, 10th Revision</italic> (<italic>ICD-10</italic>) [<xref ref-type="bibr" rid="ref24">24</xref>]. Topics were sorted into medical disciplines to optimize the analysis by clustering topics into larger groups.</p>
        <p>These disciplines corresponded to chapter titles in the <italic>ICD-10</italic>. We then designated keywords that corresponded to each of these topics. For example, for the topic of STIs, keywords included “antibiotics,” “gonorrhea,” “chlamydia,” and “bacterial vaginosis.” Additional keywords were chosen from the corresponding article topic on UpToDate (Wolters Kluwer N.V.) [<xref ref-type="bibr" rid="ref25">25</xref>], a reference for health care providers covering the diagnosis, pathophysiology, and treatment of a broad spectrum of medical conditions. In addition, several topics related to the health care system but not to a disease or topic were created, such as medical billing. Finally, for posts that did not fit with any of the aforementioned topics, a <italic>nonmedical</italic> topic was devised. Posts that corresponded to an existing topic were assigned to that topic.</p>
        <p>The topics and disciplines that we formulated corresponded to the diagnoses and chapters in the <italic>ICD-10</italic>. A list of topics with their corresponding category is available in Table S2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. This categorization system is similar to the categorization of diseases and topics that health care providers follow. Therefore, our topics and medical disciplines were validated by an existing and accepted hierarchy of disease classification. We chose to use the <italic>ICD-10</italic> over other controlled vocabulary systems such as the Medical Subject Headings thesaurus of the National Library of Medicine and the Logical Observation Identifiers Names and Codes database because the <italic>ICD-10</italic> is the system that most physicians are in contact with and is the most targeted at covering the diagnosis of diseases. In contrast, the Medical Subject Headings thesaurus is a broader system for indexing publications that encompasses anatomy, organisms, and drugs, among many other topics.</p>
        <p>During this process, additional irrelevant subreddits and terms were excluded from the query. In total, 3 iterations of keyword selection, each performed on a 100-post set, were completed. This generated our initial topic keyword file.</p>
      </sec>
      <sec>
        <title>Step 3: Topic Refinement and Determination of False-Positive Rate as Means of Validating Topic Assignment</title>
        <p>To begin automatically assigning topics to posts (<xref rid="figure2" ref-type="fig">Figure 2</xref>C), we created a script in R (R Foundation for Statistical Computing) that first put each post into tidy format using the <italic>tidyverse</italic> package [<xref ref-type="bibr" rid="ref26">26</xref>]. The script then assigned a single topic to each post based on words found in the post and on the keyword file. With further manual analyses of more posts, we added more keywords to each topic with the goal of improving future topic assignment in later iterations.</p>
        <p>We read through 100-post samples to add keywords to topics. After each run, we manually validated the accuracy of the topic assignments and iterated through this review process for 15 runs. Our topic assignments were reviewed by SAN and GC. Keyword classifications were reviewed by SAN and GC, as well as by MF and JW, 2 clinical pathologists. Accuracy was determined by reading the title and content of the posts and determining whether the topic captured the essence of the post. Topic assignment was designated as either correct or incorrect. We maintained objectivity by blinding the topic reviewer to each post’s topic as assigned by the script before manually assigning a topic to that post. An example of a post and its assigned topic is as follows:</p>
        <disp-quote>
          <p>POST: I find that when I go through bouts of anxiety the mornings are usually the hardest, no appetite, tired etc, but as the day goes on I find I feel better, even to the extent by evening time I feel “normal.”</p>
        </disp-quote>
        <disp-quote>
          <p>ASSIGNED TOPIC: Anxiety</p>
        </disp-quote>
        <p>We then determined how many posts’ topics had been correctly assigned per run and calculated an accuracy rate. During this process, we improved our script by allowing multi-word keywords and lemmatizing keywords. In addition, more subreddits were excluded to improve accuracy (Table S3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p>
        <p>In addition, our algorithm excluded irrelevant posts based on irrelevant terms and subreddits determined in step 2. During the manual review process, we reviewed which posts were determined to be irrelevant by the algorithm to determine the accuracy and efficacy of using those exclusion methods [<xref ref-type="bibr" rid="ref27">27</xref>-<xref ref-type="bibr" rid="ref29">29</xref>]. Then, in each iteration, we calculated the false-positive rate, defined as 1 minus the proportion of relevant posts (that is, 1 minus the number of relevant posts divided by the total number of posts) [<xref ref-type="bibr" rid="ref30">30</xref>].</p>
        <p>Posts were defined as relevant to health care if the main subject of the post related to seeking a diagnosis for a medical condition, discussion of treatment and management of a medical condition, or medical billing. An example of such a post is as follows:</p>
        <disp-quote>
          <p>Licensed skincare practitioner here. Get it checked. SKs [seborrheic keratoses] can itch and flake. Also may be BCC.</p>
        </disp-quote>
        <p>An example of an irrelevant post is as follows:</p>
        <disp-quote>
          <p>Him going around checking if his wife cleaned properly is not something that should be rationalised....</p>
        </disp-quote>
      </sec>
      <sec>
        <title>Step 4: Analysis of Reddit Data From January 1, 2019, to December 31, 2019, and Subreddit Analysis</title>
        <p>To restrict our final analysis to posts most likely to be relevant to health-related discussion, we further limited the posts in the final analysis to those from certain subreddits. We specifically selected the 77 health-related subreddits posted on <italic>r/listofsubreddits</italic> and manually read through these subreddits to check for relevance to health discussions. In addition, we chose 10 subreddits with the most posts from our data sample to gather a broad range of Reddit discussion and another 8 health-related subreddits not posted on <italic>r/listofsubreddits</italic> that we determined contained relevant posts. In total, we obtained 95 subreddits.</p>
        <p>We used the topic keyword file to automatically assign topics and medical disciplines to the set of Reddit posts that matched the query described previously (<xref rid="figure2" ref-type="fig">Figure 2</xref>D). Of note, we found that only posts from 89% (85/95) of the subreddits were assigned to a topic, indicating that the other 10 subreddits did not contain any health-related discussion as determined by the algorithm. We manually read through 300 posts to determine the accuracy rate. The topic assignments then underwent further analysis to determine the distribution of topics and medical disciplines, distribution of posts in subreddits, and distribution of topics in each subreddit. Finally, we selected quotes from our quantitative results to provide human-relatable insights that illustrated what was discussed in each discipline, as previously done in other social media–mining research [<xref ref-type="bibr" rid="ref27">27</xref>,<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref32">32</xref>].</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Step 1: Determination of Relevant Posts, Subreddit Limitation, and Query Refinement</title>
        <p>In total, 347,130 posts from January 1, 2019, to December 31, 2019, were downloaded from Reddit. Of those 347,130 posts, 109,653 (31.59%) belonged to subreddits that were determined to be irrelevant, and 237,477 (68.41%) came from relevant subreddits. Irrelevant subreddits were found to be those pertaining to games, popular media, and technology (Table S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p>
        <p>In step 1 (<xref rid="figure2" ref-type="fig">Figure 2</xref>A), the exclusion of irrelevant subreddits from our query decreased the false-positive rate of irrelevant posts from 59% to 29% (calculated from a random sample of 100 posts). We did not attempt to further decrease the false-positive rate in this step to avoid overexcluding subreddits and posts in the manual review step.</p>
      </sec>
      <sec>
        <title>Steps 2 and 3: Topic Creation and Validation</title>
        <p>A total of 82 topics were created through the inductive workflow outlined previously and sorted into 17 medical disciplines. Each topic was assigned to only 1 medical discipline. We validated our choices of topics and medical disciplines by comparing these categorizations to the diseases and medical topics delineated in the <italic>ICD-10</italic>. Of the 82 topics we created, 80 (98%) had a corresponding topic in the <italic>ICD-10</italic>; the exceptions were the <italic>medical billing</italic> and <italic>nonmedical</italic> topics. The accuracy of the topic assignments in this step was 56.3% (SD 4.92%; SEM 4.62%).</p>
      </sec>
      <sec>
        <title>Step 4: Topics and Medical Disciplines</title>
        <p>In step 4, subreddits to include in the final analysis were identified. While our objective in step 1 was to reduce the false-positive rate without being too restrictive (eliminating only subreddits least likely to contain medical discussion), our objective in this step was to keep only subreddits most likely to contain medical discussions. In total, 95 subreddits were chosen. These subreddits contained 78,980 posts.</p>
        <p>Limiting posts to only relevant subreddits further decreased the false-positive rate from 29% to 15.5%. The accuracy rate in this step was 62.5% (SD 1.59%; SEM 0.793%), which was higher than in steps 1 and 3. Therefore, limiting posts to mainly medically relevant subreddits improved the relevance and accuracy compared to only excluding irrelevant subreddits.</p>
        <p>The relative frequency of each topic was calculated (<xref rid="figure3" ref-type="fig">Figure 3</xref>). STIs, eye disorders, anxiety, and pregnancy had the highest frequency at 7.44% (5876/78,980), 5.6% (4423/78,980), 5.43% (4289/78,980), and 5.09% (4020/78,980) of all posts, respectively. Interestingly, 10 topics had a 0% relative frequency: asthma, body dysmorphic disorder, cystic fibrosis, dementia, gestational diabetes, infectious mononucleosis, Lyme disease, testicular cancer, thyroid (unspecified), and vaccination. Nonmedical posts made up 3.87% (3057/78,980) of all posts. If including the <italic>nonmedical</italic> topic, 80% (63,184/78,980) of posts were categorized within the first 34% (28/82) of topics. The mean relative frequency of all topics was 1.22% (SD 0.15%).</p>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Relative frequency of all topics in descending order as determined by the topic assignment algorithm. The cumulative frequency of all topics is also shown. ADHD: attention-deficit/hyperactivity disorder; HPV: human papillomavirus; LGBTQ: lesbian, gay, bisexual, transgender, and queer; PCOS: polycystic ovary syndrome; PTSD: posttraumatic stress disorder; STI: sexually transmitted infection.</p>
          </caption>
          <graphic xlink:href="formative_v9i1e55309_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>As 34% (28/82) of the topics comprised 80% (63,184/78,980) of posts, this points to a skewed distribution of topics. In total, 61% (17/28) of those topics belonged to the top 4 medical disciplines (psychiatry and mental health; genitourinary and reproductive health; infectious diseases; and endocrinology, nutrition, and metabolism).</p>
        <p>Topics were grouped into 17 broader medical disciplines (<xref ref-type="table" rid="table2">Table 2</xref>) based on the categorization scheme of the chapter codes in the <italic>ICD-10</italic>, as described previously. The most discussed disciplines were psychiatry and mental health; genitourinary (related to the urinary and reproductive systems) and reproductive health; infectious diseases; and endocrinology, nutrition, and metabolism, whose posts, respectively, constituted 26.6% (21,009/78,980), 13.6% (10,741/78,980), 8.95% (7069/78,980), and 8.91% (7037/78,980) of all analyzed posts. Psychiatry and mental health comprised most posts. Interestingly, most of the other medical disciplines were discussed with similar relative frequencies. The next most common medical discipline was hematology and immunology with a 5.88% (4644/78,980) relative frequency. The medical discipline with the lowest relative frequency was otolaryngology (related to medicine dealing with the ear, nose, and throat) at 0.57% (450/78,980).</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>The relative frequency of the broader medical disciplines, into which the medical topics were sorted, shown in descending order.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="500"/>
            <col width="500"/>
            <col width="0"/>
            <thead>
              <tr valign="top">
                <td>Medical discipline</td>
                <td>Relative frequency</td>
                <td>
                  <break/>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Psychiatry and mental health</td>
                <td>0.266</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>Genitourinary and reproductive health</td>
                <td>0.136</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>Infectious diseases</td>
                <td>0.0895</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>Endocrinology, nutrition, and metabolism</td>
                <td>0.0891</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>Hematology and immunology</td>
                <td>0.0588</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>Ophthalmology</td>
                <td>0.0572</td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>Musculoskeletal and connective tissue conditions</td>
                <td colspan="2">0.0476</td>
              </tr>
              <tr valign="top">
                <td>Gastroenterology</td>
                <td colspan="2">0.0426</td>
              </tr>
              <tr valign="top">
                <td>Dermatology</td>
                <td colspan="2">0.0410</td>
              </tr>
              <tr valign="top">
                <td>Nonmedical</td>
                <td colspan="2">0.0387</td>
              </tr>
              <tr valign="top">
                <td>Neurology</td>
                <td colspan="2">0.0373</td>
              </tr>
              <tr valign="top">
                <td>Cardiovascular</td>
                <td colspan="2">0.0353</td>
              </tr>
              <tr valign="top">
                <td>Pulmonology</td>
                <td colspan="2">0.0183</td>
              </tr>
              <tr valign="top">
                <td>Medical; other</td>
                <td colspan="2">0.0160</td>
              </tr>
              <tr valign="top">
                <td>Neoplasms</td>
                <td colspan="2">0.0157</td>
              </tr>
              <tr valign="top">
                <td>Dentistry</td>
                <td colspan="2">0.0095</td>
              </tr>
              <tr valign="top">
                <td>Otolaryngology</td>
                <td colspan="2">0.0022</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <p>The most common topics in the 4 most discussed medical disciplines are shown in <xref ref-type="table" rid="table3">Table 3</xref>. Within the medical discipline of psychiatry and mental health, the 3 most common topics were anxiety, addiction and drug use, and attention-deficit/hyperactivity disorder (ADHD) with relative frequencies of 20.42% (4289/21,009), 17.3% (3635/21,009), and 15.1% (3172/21,009), respectively. In the medical discipline of infectious diseases, the most common topic by a significant margin was STIs, making up 83.12% (5876/7069) of infectious disease posts. HIV and influenza made up 11.01% (778/7069) and 3.3% (233/7069) of posts, respectively. In genitourinary and reproductive health, pregnancy was the most common topic, comprising 37.43% (4020/10,741) of genitourinary and reproductive health posts, followed by menstrual cycle (1665/10,741, 15.5%) and male reproductive health (591/10,741, 5.5%). Finally, posts within the medical discipline of endocrinology, nutrition, and metabolism were more evenly distributed across topics. Hypothyroidism had the greatest number of posts (2013/7037, 28.61%), followed by vitamins (1534/7037, 21.8%) and diabetes (1316/7037, 18.7%).</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Relative frequency of topics on Reddit, as determined by our algorithm, within medical disciplines. The breakdown of the relative frequency of topics in the 4 most prevalent medical disciplines is as follows: psychiatry and mental health; genitourinary and reproductive health; infectious diseases; and endocrinology, nutrition, and metabolism. The medical disciplines are also shown in descending order by prevalence.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="670"/>
            <col width="300"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Medical discipline and topic</td>
                <td>Relative frequency</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="3">
                  <bold>Psychiatry and mental health</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Anxiety</td>
                <td>0.203</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Addiction and drug use</td>
                <td>0.169</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>ADHD<sup>a</sup></td>
                <td>0.151</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Obsessive-compulsive disorder</td>
                <td>0.139</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Abuse</td>
                <td>0.094</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>PTSD<sup>b</sup></td>
                <td>0.087</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Depression</td>
                <td>0.079</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Alcoholism</td>
                <td>0.031</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Autism</td>
                <td>0.010</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Psychiatry</td>
                <td>0.0090</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Tobacco use</td>
                <td>0.0085</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>LGBTQ<sup>c</sup> health</td>
                <td>0.0051</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Body dysmorphic disorder</td>
                <td>0.0015</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Dementia</td>
                <td>0.0013</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Genitourinary and reproductive health</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Pregnancy</td>
                <td>0.376</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Menstrual cycle</td>
                <td>0.160</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Male reproductive health</td>
                <td>0.088</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Testosterone use</td>
                <td>0.081</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Urinary tract infection</td>
                <td>0.068</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>HPV<sup>d</sup></td>
                <td>0.053</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Miscarriage</td>
                <td>0.044</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Female reproductive health</td>
                <td>0.042</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Endometriosis</td>
                <td>0.035</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Benign prostatic hypertrophy</td>
                <td>0.028</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Nephrology; unspecified</td>
                <td>0.024</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Gestational diabetes</td>
                <td>0</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Testicular torsion</td>
                <td>0</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Infectious diseases</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>STIs<sup>e</sup></td>
                <td>0.831</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>HIV</td>
                <td>0.118</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Influenza</td>
                <td>0.039</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Measles</td>
                <td>0.013</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Infectious mononucleosis</td>
                <td>0</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Lyme disease</td>
                <td>0</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Vaccination</td>
                <td>0</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Endocrinology, nutrition, and metabolism</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Hypothyroidism</td>
                <td>0.286</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Vitamins</td>
                <td>0.216</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Diabetes</td>
                <td>0.188</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Dieting</td>
                <td>0.178</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>PCOS<sup>f</sup></td>
                <td>0.078</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Bodybuilding</td>
                <td>0.029</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Obesity</td>
                <td>0.022</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Hyperthyroidism</td>
                <td>0.002</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Endocrinology</td>
                <td>0.001</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Thyroid; unspecified</td>
                <td>0</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>ADHD: attention-deficit/hyperactivity disorder.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>PTSD: posttraumatic stress disorder.</p>
            </fn>
            <fn id="table3fn3">
              <p><sup>c</sup>LGBTQ: lesbian, gay, bisexual, transgender, and queer.</p>
            </fn>
            <fn id="table3fn4">
              <p><sup>d</sup>HPV: human papillomavirus.</p>
            </fn>
            <fn id="table3fn5">
              <p><sup>e</sup>STI: sexually transmitted infection.</p>
            </fn>
            <fn id="table3fn6">
              <p><sup>f</sup>PCOS: polycystic ovary syndrome.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Posts per Subreddit</title>
        <p>Of the 95 subreddits identified in step 4, a total of 10 (11%) did not contain any posts that were assigned to our topics and were excluded, leaving 85 final subreddits. These 85 subreddits contained 78,980 posts (<xref ref-type="table" rid="table4">Table 4</xref>). The subreddits with the most posts were those that we describe as <italic>general</italic>, or non–topic-specific, subreddits. The top 10 subreddits with the most posts included 6 general subreddits: <italic>r/askreddit</italic>, <italic>r/askdocs</italic>, <italic>r/amitheasshole</italic>, <italic>r/medical</italic>, <italic>r/legaladvice</italic>, and <italic>r/advice</italic>. The most popular subreddit was <italic>r/askreddit</italic> with 26.7% (21,086/78,980) of posts, followed by <italic>r/askdocs</italic> with 12.02% (9496/78,980) of posts. A total of 61.93% (48,912/78,980) of the posts analyzed were found in the top 5 subreddits by number of posts, and 79.91% (63,112/78,980) were found in the top 15 subreddits.</p>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Subreddits by number of posts analyzed showing the relative differences in the number of posts in each subreddit (N=78,980).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="500"/>
            <col width="500"/>
            <col width="0"/>
            <thead>
              <tr valign="top">
                <td>Subreddit</td>
                <td>Posts analyzed, n (%)</td>
                <td>
                  <break/>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>r/askreddit</td>
                <td colspan="2">21,086 (26.7)</td>
              </tr>
              <tr valign="top">
                <td>r/askdocs</td>
                <td colspan="2">9496 (12.02)</td>
              </tr>
              <tr valign="top">
                <td>r/amitheasshole</td>
                <td colspan="2">5473 (6.93)</td>
              </tr>
              <tr valign="top">
                <td>r/relationship_advice</td>
                <td colspan="2">5322 (6.74)</td>
              </tr>
              <tr valign="top">
                <td>r/relationships</td>
                <td colspan="2">2775 (3.51)</td>
              </tr>
              <tr valign="top">
                <td>r/medical</td>
                <td colspan="2">2495 (3.16)</td>
              </tr>
              <tr valign="top">
                <td>r/skincareaddiction</td>
                <td colspan="2">2268 (2.87)</td>
              </tr>
              <tr valign="top">
                <td>r/legaladvice</td>
                <td colspan="2">2227 (2.82)</td>
              </tr>
              <tr valign="top">
                <td>r/advice</td>
                <td colspan="2">2150 (2.72)</td>
              </tr>
              <tr valign="top">
                <td>r/teenagers</td>
                <td colspan="2">1974 (2.5)</td>
              </tr>
              <tr valign="top">
                <td>r/ADHD</td>
                <td colspan="2">1876 (2.38)</td>
              </tr>
              <tr valign="top">
                <td>r/babybumps</td>
                <td colspan="2">1775 (2.25)</td>
              </tr>
              <tr valign="top">
                <td>r/Testosterone</td>
                <td colspan="2">1746 (2.21)</td>
              </tr>
              <tr valign="top">
                <td>r/STD</td>
                <td colspan="2">1345 (1.7)</td>
              </tr>
              <tr valign="top">
                <td>r/Anxiety</td>
                <td colspan="2">1215 (1.54)</td>
              </tr>
              <tr valign="top">
                <td>r/Depression</td>
                <td colspan="2">1193 (1.51)</td>
              </tr>
              <tr valign="top">
                <td>r/pregnant</td>
                <td colspan="2">1166 (1.48)</td>
              </tr>
              <tr valign="top">
                <td>r/birthcontrol</td>
                <td colspan="2">1102 (1.4)</td>
              </tr>
              <tr valign="top">
                <td>r/childfree</td>
                <td colspan="2">966 (1.22)</td>
              </tr>
              <tr valign="top">
                <td>r/Hypothyroidism</td>
                <td colspan="2">880 (1.11)</td>
              </tr>
              <tr valign="top">
                <td>r/fitness</td>
                <td colspan="2">778 (0.99)</td>
              </tr>
              <tr valign="top">
                <td>r/MentalHealth</td>
                <td colspan="2">741 (0.94)</td>
              </tr>
              <tr valign="top">
                <td>r/Diabetes</td>
                <td colspan="2">699 (0.89)</td>
              </tr>
              <tr valign="top">
                <td>r/Dentistry</td>
                <td colspan="2">602 (0.76)</td>
              </tr>
              <tr valign="top">
                <td>r/science</td>
                <td colspan="2">489 (0.62)</td>
              </tr>
              <tr valign="top">
                <td>r/diagnoseme</td>
                <td colspan="2">467 (0.59)</td>
              </tr>
              <tr valign="top">
                <td>r/Infertility</td>
                <td colspan="2">446 (0.56)</td>
              </tr>
              <tr valign="top">
                <td>r/SuicideWatch</td>
                <td colspan="2">429 (0.54)</td>
              </tr>
              <tr valign="top">
                <td>r/Optometry</td>
                <td colspan="2">410 (0.52)</td>
              </tr>
              <tr valign="top">
                <td>r/Ibs</td>
                <td colspan="2">391 (0.5)</td>
              </tr>
              <tr valign="top">
                <td>r/CrohnsDisease</td>
                <td colspan="2">376 (0.48)</td>
              </tr>
              <tr valign="top">
                <td>r/Cancer</td>
                <td colspan="2">349 (0.44)</td>
              </tr>
              <tr valign="top">
                <td>r/Fibromyalgia</td>
                <td colspan="2">318 (0.4)</td>
              </tr>
              <tr valign="top">
                <td>r/ChronicPain</td>
                <td colspan="2">300 (0.38)</td>
              </tr>
              <tr valign="top">
                <td>r/MultipleSclerosis</td>
                <td colspan="2">279 (0.35)</td>
              </tr>
              <tr valign="top">
                <td>r/Aspergers</td>
                <td colspan="2">272 (0.34)</td>
              </tr>
              <tr valign="top">
                <td>r/bpd</td>
                <td colspan="2">235 (0.3)</td>
              </tr>
              <tr valign="top">
                <td>r/SleepApnea</td>
                <td colspan="2">230 (0.29)</td>
              </tr>
              <tr valign="top">
                <td>r/BipolarReddit</td>
                <td colspan="2">201 (0.25)</td>
              </tr>
              <tr valign="top">
                <td>r/cfs</td>
                <td colspan="2">188 (0.24)</td>
              </tr>
              <tr valign="top">
                <td>r/askdoctorsmeeee</td>
                <td colspan="2">175 (0.22)</td>
              </tr>
              <tr valign="top">
                <td>r/askdoctors</td>
                <td colspan="2">150 (0.19)</td>
              </tr>
              <tr valign="top">
                <td>r/Rheumatoid</td>
                <td colspan="2">127 (0.16)</td>
              </tr>
              <tr valign="top">
                <td>r/medicine</td>
                <td colspan="2">125 (0.16)</td>
              </tr>
              <tr valign="top">
                <td>r/Eczema</td>
                <td colspan="2">120 (0.15)</td>
              </tr>
              <tr valign="top">
                <td>r/Asthma</td>
                <td colspan="2">118 (0.15)</td>
              </tr>
              <tr valign="top">
                <td>r/InterstitialCystitis</td>
                <td colspan="2">117 (0.15)</td>
              </tr>
              <tr valign="top">
                <td>r/Nutrition</td>
                <td colspan="2">115 (0.15)</td>
              </tr>
              <tr valign="top">
                <td>r/Dementia</td>
                <td colspan="2">86 (0.11)</td>
              </tr>
              <tr valign="top">
                <td>r/askscience</td>
                <td colspan="2">84 (0.11)</td>
              </tr>
              <tr valign="top">
                <td>r/Healthcare</td>
                <td colspan="2">80 (0.1)</td>
              </tr>
              <tr valign="top">
                <td>r/StopSmoking</td>
                <td colspan="2">79 (0.1)</td>
              </tr>
              <tr valign="top">
                <td>r/Dysautonomia</td>
                <td colspan="2">77 (0.1)</td>
              </tr>
              <tr valign="top">
                <td>r/Psoriasis</td>
                <td colspan="2">75 (0.09)</td>
              </tr>
              <tr valign="top">
                <td>r/Keratoconus</td>
                <td colspan="2">72 (0.09)</td>
              </tr>
              <tr valign="top">
                <td>r/Pharmacy</td>
                <td colspan="2">59 (0.07)</td>
              </tr>
              <tr valign="top">
                <td>r/Vegetarian</td>
                <td colspan="2">52 (0.07)</td>
              </tr>
              <tr valign="top">
                <td>r/Massage</td>
                <td colspan="2">48 (0.06)</td>
              </tr>
              <tr valign="top">
                <td>r/KidneyStones</td>
                <td colspan="2">47 (0.06)</td>
              </tr>
              <tr valign="top">
                <td>r/GravesDisease</td>
                <td colspan="2">40 (0.05)</td>
              </tr>
              <tr valign="top">
                <td>r/Menieres</td>
                <td colspan="2">32 (0.04)</td>
              </tr>
              <tr valign="top">
                <td>r/Pilonidalcyst</td>
                <td colspan="2">31 (0.04)</td>
              </tr>
              <tr valign="top">
                <td>r/Posture</td>
                <td colspan="2">30 (0.04)</td>
              </tr>
              <tr valign="top">
                <td>r/Paleo</td>
                <td colspan="2">27 (0.03)</td>
              </tr>
              <tr valign="top">
                <td>r/Gastroparesis</td>
                <td colspan="2">24 (0.03)</td>
              </tr>
              <tr valign="top">
                <td>r/Hemophilia</td>
                <td colspan="2">22 (0.03)</td>
              </tr>
              <tr valign="top">
                <td>r/Psychology</td>
                <td colspan="2">17 (0.02)</td>
              </tr>
              <tr valign="top">
                <td>r/TroubledTeens</td>
                <td colspan="2">16 (0.02)</td>
              </tr>
              <tr valign="top">
                <td>r/PancreaticCancer</td>
                <td colspan="2">13 (0.02)</td>
              </tr>
              <tr valign="top">
                <td>r/Amblyopia</td>
                <td colspan="2">11 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>r/LactoseIntolerant</td>
                <td colspan="2">9 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>r/AlternativeHealth</td>
                <td colspan="2">8 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>r/NaturalBeauty</td>
                <td colspan="2">7 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>r/PublicHealth</td>
                <td colspan="2">6 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>r/Transplant</td>
                <td colspan="2">5 (0.01)</td>
              </tr>
              <tr valign="top">
                <td>r/CareGiverSupport</td>
                <td colspan="2">3 (&lt;0.01)</td>
              </tr>
              <tr valign="top">
                <td>r/hepc</td>
                <td colspan="2">3 (&lt;0.01)</td>
              </tr>
              <tr valign="top">
                <td>r/chd</td>
                <td colspan="2">2 (&lt;0.01)</td>
              </tr>
              <tr valign="top">
                <td>r/Flu</td>
                <td colspan="2">2 (&lt;0.01)</td>
              </tr>
              <tr valign="top">
                <td>r/Juicing</td>
                <td colspan="2">1 (&lt;0.01)</td>
              </tr>
              <tr valign="top">
                <td>r/Pescetarian</td>
                <td colspan="2">1 (&lt;0.01)</td>
              </tr>
              <tr valign="top">
                <td>r/UKHealthcare</td>
                <td colspan="2">1 (&lt;0.01)</td>
              </tr>
              <tr valign="top">
                <td>r/Dystonia</td>
                <td colspan="2">1 (&lt;0.01)</td>
              </tr>
              <tr valign="top">
                <td>r/ItsNeverLupus</td>
                <td colspan="2">1 (&lt;0.01)</td>
              </tr>
              <tr valign="top">
                <td>r/MacularDegeneration</td>
                <td colspan="2">1 (&lt;0.01)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>General Subreddits Versus Topic-Specific Subreddits</title>
        <p>Subreddits that we defined as <italic>general</italic> were those that did not focus on a specific health topic. These 15 subreddits were <italic>r/askreddit</italic>, <italic>r/askdocs</italic>, <italic>r/amitheasshole</italic>, <italic>r/relationship_advice</italic>, <italic>r/relationships</italic>, <italic>r/medical</italic>, <italic>r/legaladvice</italic>, <italic>r/advice</italic>, <italic>r/teenagers</italic>, <italic>r/fitness</italic>, <italic>r/science</italic>, <italic>r/diagnoseme</italic>, <italic>r/askdoctorsmeeee</italic>, <italic>r/askdoctors</italic>, and <italic>r/medicine</italic>. Compared to topic-specific subreddits, a wider variety of topics was represented in these subreddits, and no one topic dominated over other topics in each subreddit. We identified the top 5 topics by number of posts in each subreddit. Among the general subreddits, these topics comprised, on average, 41.1% of posts (SD 12.9%; 95% CI 28.2%-54%). For comparison, among topic-specific subreddits, the top 5 topics on average comprised 70.3% of posts (SD 38.3%; 95% CI 32%-100%).</p>
        <p>In 67% (10/15) of the general subreddits, STIs was one of the top 5 topics (<xref ref-type="table" rid="table5">Table 5</xref>). Notably, the second most prevalent topic in <italic>r/science</italic> was human papillomavirus, whereas the most prevalent topic in <italic>r/healthcare</italic> (not one of the top 15 general subreddits) was medical billing. Interestingly, we also noted that the top 5 topics in <italic>r/askreddit</italic>, which is not specifically targeted toward health issues, were musculoskeletal conditions, eye disorders, ADHD, addiction and drug use, and allergies. For comparison, in <italic>r/askdocs</italic>, the most prevalent topics were STIs, dermatology, musculoskeletal conditions, allergies, and anxiety. Mental health topics were common in the general subreddits. Anxiety appeared as a top-5 topic in 53% (8/15) of the general subreddits. In those 8 subreddits, an average of 6.27% (SD 1.7%) of all posts were assigned to the topic of anxiety. Addiction and drug use appeared as a top-5 topic in 33% (5/15) of the general subreddits, and an average of 10.9% (SD 5.30%) of all posts in those 5 subreddits were assigned to that topic. On the other hand, we found that topic-specific subreddits often had the topic of the same name as the most assigned topic (eg, the topic of ADHD would be the most assigned topic in the subreddit <italic>r/ADHD</italic>; <xref ref-type="table" rid="table6">Table 6</xref>).</p>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>The top 5 topics by number of posts in the top 15 general subreddits (subreddits without a specific health-related topic). A description of the subreddit and the total number of posts in the subreddit are provided (N=78,980).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="150"/>
            <col width="310"/>
            <col width="140"/>
            <col width="400"/>
            <thead>
              <tr valign="top">
                <td>Subreddit</td>
                <td>Description</td>
                <td>Posts, n (%)</td>
                <td>Top 5 topics in subreddit</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>r/askreddit</td>
                <td>Open question-and-answer forum</td>
                <td>21,086 (26.7)</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Musculoskeletal conditions (n=1673 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Eye disorder (n=1556 posts)</p>
                    </list-item>
                    <list-item>
                      <p>ADHD<sup>a</sup> (n=1043 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Addiction and drug use (n=1001 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Allergies (n=937 posts)</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>r/askdocs</td>
                <td>Questions and answers with verified medical professionals</td>
                <td>9496 (12.02)</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>STIs<sup>b</sup> (n=748 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Dermatology; unspecified (n=646 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Musculoskeletal conditions (n=598 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Allergies (n=465 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Anxiety (n=435 posts)</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>r/amItheasshole</td>
                <td>Users post stories to “find out if [they] were wrong”</td>
                <td>5473 (6.93)</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>STIs (n=637 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Anxiety (n=461 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Abuse (n=400 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Nonmedical (n=353 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Pregnancy (n=334 posts)</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>r/relationship_advice</td>
                <td>Relationship-based discussions</td>
                <td>5322 (6.74)</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>STIs (n=1190 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Abuse (n=530 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Dating (n=497 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Obsessive-compulsive disorder (n=374 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Anxiety (n=358 posts)</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>r/relationships</td>
                <td>Interpersonal relationship–based discussion</td>
                <td>2775 (3.51)</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>STIs (n=420 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Abuse (n=390 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Obsessive-compulsive disorder (n=281 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Dating (n=248 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Anxiety (n=222 posts)</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>r/medical</td>
                <td>Medical question–based discussion</td>
                <td>2495 (3.16)</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Dermatology; unspecified (n=235 posts)</p>
                    </list-item>
                    <list-item>
                      <p>STIs (n=175 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Musculoskeletal conditions (n=173 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Allergies (n=151 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Eye disorder (n=114 posts)</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>r/legaladvice</td>
                <td>Forum to ask “simple legal questions”</td>
                <td>2227 (2.82)</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Addiction and drug use (n=401 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Medical billing (n=373 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Musculoskeletal conditions (n=110 posts)</p>
                    </list-item>
                    <list-item>
                      <p>PTSD<sup>c</sup> (n=109 posts)</p>
                    </list-item>
                    <list-item>
                      <p>STIs (n=102 posts)</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>r/advice</td>
                <td>Advice forum</td>
                <td>2134 (2.7)</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Obsessive-compulsive disorder (n=186 posts)</p>
                    </list-item>
                    <list-item>
                      <p>STIs (n=184 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Anxiety (n=168 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Addiction and drug use (n=163 posts)</p>
                    </list-item>
                    <list-item>
                      <p>ADHD (n=144 posts)</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>r/teenagers</td>
                <td>Intended for users aged 13-19 years to discuss age-appropriate subjects</td>
                <td>1974 (2.5)</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Dermatology; unspecified (n=591 posts)</p>
                    </list-item>
                    <list-item>
                      <p>ADHD (n=154 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Eye disorder (n=101 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Depression (n=91 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Anxiety (n=73 posts)</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>r/fitness</td>
                <td>Physical fitness–based discussion</td>
                <td>778 (0.99)</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Musculoskeletal conditions (n=152 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Dieting (n=77 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Bodybuilding (n=69 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Gallbladder disorder (n=46 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Testosterone use (n=37 posts)</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>r/science</td>
                <td>Forum for new scientific research</td>
                <td>489 (0.62)</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Addiction and drug use (n=48 posts)</p>
                    </list-item>
                    <list-item>
                      <p>HPV<sup>d</sup> (n=29 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Anxiety (n=27 posts)</p>
                    </list-item>
                    <list-item>
                      <p>STIs (n=23 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Obsessive-compulsive disorder (n=19 posts)</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>r/diagnoseme</td>
                <td>Medical question–based discussion</td>
                <td>479 (0.61)</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Dermatology; unspecified (n=52 posts)</p>
                    </list-item>
                    <list-item>
                      <p>STIs (n=42 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Allergies (n=38 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Musculoskeletal conditions (n=28 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Hypothyroidism (n=25 posts)</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>r/askdoctorsmeeee</td>
                <td>Forum for medical questions</td>
                <td>175 (0.22)</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Dermatology; unspecified (n=14 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Musculoskeletal conditions (n=14 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Allergies (n=12 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Arrhythmia (n=9 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Hypothyroidism (n=9 posts)</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>r/askdoctors</td>
                <td>Forum for medical advice</td>
                <td>150 (0.19)</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>STIs (n=13 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Dermatology; unspecified (n=11 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Allergies (n=8 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Anxiety (n=8 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Gallbladder disorder (n=8 posts)</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>r/medicine</td>
                <td>Forum for physicians to discuss medicine</td>
                <td>125 (0.16)</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Addiction and drug use (n=18 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Pregnancy (n=8 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Anemia (n=6 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Gallbladder disorder (n=5 posts)</p>
                    </list-item>
                    <list-item>
                      <p>HIV (n=5 posts)</p>
                    </list-item>
                  </list>
                </td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table5fn1">
              <p><sup>a</sup>ADHD: attention-deficit/hyperactivity disorder.</p>
            </fn>
            <fn id="table5fn2">
              <p><sup>b</sup>STI: sexually transmitted infection.</p>
            </fn>
            <fn id="table5fn3">
              <p><sup>c</sup>PTSD: posttraumatic stress disorder.</p>
            </fn>
            <fn id="table5fn4">
              <p><sup>d</sup>HPV: human papillomavirus.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table6">
          <label>Table 6</label>
          <caption>
            <p>The top 5 topics by number of posts in the top 15 topic-specific subreddits (describing a certain health-related topic). A description of the subreddit and the total number of posts in the subreddit are provided (N=78,980).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="150"/>
            <col width="310"/>
            <col width="140"/>
            <col width="400"/>
            <thead>
              <tr valign="top">
                <td>Subreddit</td>
                <td>Description</td>
                <td>Posts, n (%)</td>
                <td>Top 5 topics in each subreddit</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>r/skincareaddiction</td>
                <td>Broad forum to discuss skin</td>
                <td>2268 (2.87)</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Eye disorder (n=1226 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Dermatology; unspecified (n=273 posts)</p>
                    </list-item>
                    <list-item>
                      <p>PCOS<sup>a</sup> (n=225 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Allergies (n=87 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Eczema (n=73 posts)</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>r/testosterone</td>
                <td>Testosterone replacement therapy and testosterone levels</td>
                <td>1746 (2.21)</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Vitamins (n=370 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Testosterone use (n=264 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Hypothyroidism (n=171 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Pregnancy (n=105 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Anemia (n=103 posts)</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>r/babybumps</td>
                <td>Pregnancy-related discussion</td>
                <td>1775 (2.25)</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Pregnancy (n=819 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Musculoskeletal conditions (n=69 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Anxiety (n=58 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Menstrual cycle (n=58 posts)</p>
                    </list-item>
                    <list-item>
                      <p>STIs<sup>b</sup> (n=49 posts)</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>r/ADHD</td>
                <td>Forum for people with ADHD<sup>c</sup> to exchange stories and strategies</td>
                <td>1807 (2.29)</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>ADHD (n=944 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Addiction and drug use (n=199 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Obsessive-compulsive disorder (n=112 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Depression (n=91 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Anxiety (n=87 posts)</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>r/STD</td>
                <td>Forum to discuss STDs<sup>d</sup></td>
                <td>1611 (2.04)</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>STIs (n=1158 posts)</p>
                    </list-item>
                    <list-item>
                      <p>HIV (n=75 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Anxiety (n=54 posts)</p>
                    </list-item>
                    <list-item>
                      <p>HPV<sup>e</sup> (n=48 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Respiratory infection (n=32 posts)</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>r/Pregnant</td>
                <td>Forum to discuss pregnancy</td>
                <td>1166 (1.48)</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Pregnancy (n=494 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Menstrual cycle (n=92 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Hematology (n=50 posts)</p>
                    </list-item>
                    <list-item>
                      <p>STIs (n=47 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Anxiety (n=40 posts)</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>r/Depression</td>
                <td>Support for those struggling with a depressive disorder</td>
                <td>1193 (1.51)</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Depression (n=255 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Obsessive-compulsive disorder (n=236 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Anxiety (n=129 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Addiction and drug use (n=94 posts)</p>
                    </list-item>
                    <list-item>
                      <p>ADHD (n=63 posts)</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>r/Anxiety</td>
                <td>Support for those struggling with anxiety</td>
                <td>1215 (1.54)</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Anxiety (n=628 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Obsessive-compulsive disorder (n=165 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Arrhythmia (n=55 posts)</p>
                    </list-item>
                    <list-item>
                      <p>PTSD<sup>f</sup> (n=53 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Eye disorder (n=31 posts)</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>r/birthcontrol</td>
                <td>Forum to discuss birth control</td>
                <td>1102 (1.4)</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Menstrual cycle (n=521 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Pregnancy (n=180 posts)</p>
                    </list-item>
                    <list-item>
                      <p>STIs (n=70 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Anxiety (n=26 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Musculoskeletal conditions (n=24 posts)</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>r/Childfree</td>
                <td>Forum for those who choose to not have children</td>
                <td>966 (1.22)</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Pregnancy (n=580 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Menstrual cycle (n=58 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Male reproductive health (n=32 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Abuse (n=22 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Anxiety (n=18 posts)</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>r/Hypothyroidism</td>
                <td>Forum for those with hypothyroidism</td>
                <td>779 (0.99)</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Hypothyroidism (n=519 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Anemia (n=69 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Dieting (n=29 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Vitamins (n=23 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Anxiety (n=19 posts)</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>r/MentalHealth</td>
                <td>Moderated forum to discuss mental health issues</td>
                <td>741 (0.94)</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Obsessive-compulsive disorder (n=208 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Anxiety (n=126 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Depression (n=73 posts)</p>
                    </list-item>
                    <list-item>
                      <p>ADHD (n=57 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Addiction and drug use (n=43 posts)</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>r/Dentistry</td>
                <td>Forum for dental professionals</td>
                <td>683 (0.86)</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Dentistry (n=418 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Dermatology; unspecified (n=28 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Allergies (n=24 posts)</p>
                    </list-item>
                    <list-item>
                      <p>STIs (n=23 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Musculoskeletal conditions (n=19 posts)</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>r/Diabetes</td>
                <td>Forum for those living with diabetes</td>
                <td>702 (0.89)</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Diabetes (n=491 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Eye disorder (n=35 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Anemia (n=23 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Dieting (n=19 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Vitamins (n=15 posts)</p>
                    </list-item>
                  </list>
                </td>
              </tr>
              <tr valign="top">
                <td>r/Infertility</td>
                <td>Forum for those dealing with infertility for all reasons</td>
                <td>446 (0.56)</td>
                <td>
                  <list list-type="bullet">
                    <list-item>
                      <p>Pregnancy (n=110 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Menstrual cycle (n=34 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Vitamins (n=33 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Hypothyroidism (n=29 posts)</p>
                    </list-item>
                    <list-item>
                      <p>Endometriosis (n=22 posts)</p>
                    </list-item>
                  </list>
                </td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table6fn1">
              <p><sup>a</sup>PCOS: polycystic ovary syndrome.</p>
            </fn>
            <fn id="table6fn2">
              <p><sup>b</sup>STI: sexually transmitted infection.</p>
            </fn>
            <fn id="table6fn3">
              <p><sup>c</sup>ADHD: attention-deficit/hyperactivity disorder.</p>
            </fn>
            <fn id="table6fn4">
              <p><sup>d</sup>STD: sexually transmitted disease.</p>
            </fn>
            <fn id="table6fn5">
              <p><sup>e</sup>HPV: human papillomavirus.</p>
            </fn>
            <fn id="table6fn6">
              <p><sup>f</sup>PTSD: posttraumatic stress disorder.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Medical Disciplines Divided by Subreddit</title>
        <p>We also analyzed the breakdown of posts in each subreddit differentiated by medical discipline (Figure S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). The relative frequency of medical disciplines in each subreddit was calculated by dividing the number of posts in a medical discipline by the total number of analyzed posts in that subreddit. Our analysis showed that many subreddits included posts about psychiatry and mental health. This mirrors the breakdown of medical disciplines overall as most posts belonged to that discipline. Some subreddits predominantly contained posts belonging to other medical disciplines. In those cases, the medical discipline often correlated with the subreddit (eg, in <italic>r/Hypothyroidism</italic>, most posts belonged to the endocrinology, nutrition, and metabolism medical discipline). However, most subreddits comprised posts from multiple medical disciplines.</p>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Most Prevalent Medical Topics and Disciplines</title>
        <p>By using markers of medical topics identified from broader samples of user data to categorize social media posts into specific diseases, previous studies have been able to predict diagnoses using social media information [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref20">20</xref>]. We accomplished a similar goal in our study by identifying topic keywords and using those to assign topics to posts. From there, our analysis revealed which disciplines were most prevalent across Reddit. Similarly to previous studies, we also used keywords to categorize this form of data into medical topics, but in this case, we did this on a broader scale, sorting data into all possible medical disciplines and generally not excluding posts that did not meet predetermined categories.</p>
        <p>The 4 medical disciplines with the greatest proportion of posts were psychiatry and mental health; genitourinary and reproductive health; infectious diseases; and endocrinology, nutrition, and metabolism. We note the fact that psychiatry and mental health had approximately twice as many posts as the next highest medical discipline, genitourinary and reproductive health (21,009/78,980, 26.6% vs 10,741/78,980, 13.6% of posts) as another sign that discussion of mental health is common on Reddit.</p>
        <p>Psychiatry and mental health, as a discipline, was the most prevalent. In addition to posts about anxiety, this medical discipline comprised posts about depression, addiction, alcoholism, and tobacco use. There were many posts about drug use, drug testing at work, and how drugs would affect other health conditions. Overall, the medical discipline of psychiatry and mental health emphasized the amount of concern that people have about mental health topics and that they were willing to discuss their issues online. The large proportion of posts being about mental health raises the question of whether there is insufficient access to mental health services, whether online discussion of mental health is predominant over other health topics because of anonymity, or both.</p>
        <p>Within this discipline, anxiety was another medical topic that frequently appeared, making up 5.43% (4289/78,980) of all posts and being in the top 5 topics in both general and topic-specific subreddits. Interestingly, anxiety was one of the most frequent topics not only in subreddits related to mental health but also in <italic>r/PancreaticCancer</italic>, <italic>r/STD</italic>, and <italic>r/juicing</italic>. Anxiety is a broad topic. Posts in this topic ranged from those about sharing experiences fighting melanoma to anxiety due to marijuana-triggered hallucinations to broad descriptions of “head pressure, headache, jaw pain, throat tension.” Because the description of anxiety is open to interpretation, capturing which posts discuss anxiety is difficult and will result in a variety of posts that mention anxious feelings and worry, but the main subject of the post may not necessarily be anxiety.</p>
        <p>We note that the most prevalent medical disciplines and topics can entail feelings of shame and embarrassment, be highly sensitive, or evoke a need for secrecy [<xref ref-type="bibr" rid="ref33">33</xref>-<xref ref-type="bibr" rid="ref35">35</xref>]. STIs was the most common topic, making up 7.44% (5876/78,980) of all posts. STIs had a significantly higher relative frequency than the next most common topic, eye disorders. Posts on this topic included many situational descriptions of suspected STIs. An example of an STI post is as follows:</p>
        <disp-quote>
          <p>[These] past couple of weeks, my girlfriend (we are in a monogamous relationship) found out that she was having light stringy brown discharge midway through her period cycles...So she went to the doctor and the doctor has prescribed her 1g Azithromycin (one time) and a 1 week course of Metrogyl 400 gms...The doctor also adviced [sic] her that I should take only the Azithromycin as I could have the infection as well (no blood tests or similar were done, the doctor did a physical examination)...</p>
        </disp-quote>
        <p>The medical discipline of endocrinology, nutrition, and metabolism, which included posts about hypothyroidism, vitamins, and diabetes, among others, presented an interesting category. Posts discussed checking vitamin D levels and supplements. However, many posts also overlapped with the topic of pregnancy, such as checking vitamin levels during pregnancy and hormone levels. Therefore, it was difficult to parse whether all these posts were truly about endocrinology, nutrition, and metabolism. We also noticed that there were posts mentioning thyroid problems or diseases that were not specific to hypo- or hyperthyroidism. While these posts were more often categorized under hypothyroidism, the endocrinology, nutrition, and metabolism medical discipline more accurately captured them under a broader category.</p>
        <p>Overall, Reddit holds advantages over other social media platforms because its culture trends toward anonymity. Authors have discussed how the anonymity of communication over the internet reduces social desirability bias and social anxiety. Users are less inhibited and more willing to discuss things openly [<xref ref-type="bibr" rid="ref5">5</xref>]. Other studies have suggested that the internet is useful for collecting self-reports on risky health behaviors such as alcohol use, drug use, and smoking. Respondents accurately self-reported behaviors online, even ones that were undesirable, because of the perception of privacy [<xref ref-type="bibr" rid="ref36">36</xref>]. It is established that social media sites with a culture of anonymity allow people to talk about sensitive issues online without fear of social desirability bias. Our study leverages that culture to gather a broader look at all medical disciplines rather than a predetermined set of medical topics. Our methods classified user data into those topics iteratively and broadly into all possible medical disciplines. Therefore, our findings expand on the literature by highlighting the most prevalent disciplines of conversation in a platform-wide study.</p>
        <p>Interestingly, the top 5 topics may not be considered top health topics by health care providers. In a recent metric published by Blue Cross Blue Shield (Blue Cross Blue Shield Health Index), the top 10 health topics that had the greatest impact on quality of life in the United States did not include any of the topics that we mentioned previously. Therefore, our study may show that there is a different set of online topics, or it may reinforce that mining internet data reveals a different set of health concerns from those traditionally discussed or considered to be major health issues.</p>
      </sec>
      <sec>
        <title>The Distribution of Topics</title>
        <p>The aforementioned skewed distribution of topics suggests to us that conversation on Reddit is concentrated in a minority of discussion topics. This correlates with our supposition that users, when discussing health topics, overwhelmingly post about issues related to mental health, reproductive health, and infectious diseases, as well as endocrine, metabolic, and nutritional issues. The relative paucity of other topics may suggest that these are not discussed either in the general subreddits we focused on or in the topic-specific subreddits in the selection of health-related subreddits provided by Reddit but may be discussed in other subreddits.</p>
        <p>As previously noted, 10 topics had no posts assigned to them. This meant that some topics that were created inductively during manual post review did not have any posts assigned to them during automatic topic assignment in the 1-year dataset. This invites us to investigate why certain topics would not have posts assigned to them. One reason is that posts in the subreddits included in the final analysis may simply not have discussed those topics. Another reason is that posts about a certain topic, for example, vaccination, may have also discussed measles, influenza, or human papillomavirus and, subsequently, were assigned to other topics, such as upper respiratory infection and STIs.</p>
        <p>In general, users appeared more willing to talk about subjects that would otherwise be uncomfortable to discuss in person. This is in line with other studies that have examined how people are more willing to talk about chronic diseases on social media. They are also willing to share their disease experience in detail. Previous work has found that, on certain disease-oriented subreddits, users freely discuss disease-anatomy relationships, such as cancer-lymph and asthma-lung relationships. The authors write that this openness on subreddits may stem from a desire to find others who share their experience of the disease [<xref ref-type="bibr" rid="ref24">24</xref>] and users feel reassured by the subreddits’ shared experiences.</p>
      </sec>
      <sec>
        <title>Giving Advice</title>
        <p>A subset of subreddits includes those where users can post a question with the expectation that a subject matter expert will provide an answer while also being open to public input. On subreddits such as <italic>r/askdocs</italic> and <italic>r/askdoctorsmeeee</italic>, the experts are stated to be health professionals verified by the subreddit moderators. In a way, these accounts are analogous to the quantified influence described in the study by Koo et al [<xref ref-type="bibr" rid="ref37">37</xref>] and the power accounts in the study by Sugawara et al [<xref ref-type="bibr" rid="ref38">38</xref>], showing that, similarly to Twitter, medical advice about testing and diagnosis may be heavily influenced by several accounts on Reddit.</p>
        <p><italic>r/askdocs</italic> has approximately 270,000 members, whereas <italic>r/askdoctorsmeeee</italic> currently has approximately 14,400 members. In these subreddits, the most prevalent topics were similar to those found in other subreddits. We believe that many people turn to these forums for advice and that these subreddits are representative of the kinds of conversations that users have elsewhere on the site. However, because of the availability of experts on certain subreddits, Reddit users may be more discerning about the type of advice they expect to receive.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>We initially wanted to determine whether there was any correlation between medical topics that were mentioned on Reddit and medical tests that were mentioned on Reddit. However, our review of the Reddit posts demonstrated that users, in general, did not always mention specific medical tests, instead referring or alluding to a medical condition or a broad class of diseases, such as autoimmune diseases or STIs. At times, the content of a post would simply talk about “something being wrong,” making it difficult to classify into a topic.</p>
        <p>We noted other limitations, some of which we were able to address. Some posts were included that only had phrases such as “you should get that checked out,” which were too vague to categorize under any topic. However, this problem was mitigated by using posts only from the 95 subreddits, where the frequency of such comments was lower. This was because those select subreddits, being more focused on their specific diseases or topics, had fewer vague comments and tended to have more thoughtful, directed discussion.</p>
        <p>It is possible that keyword selection introduced bias into our topic assignments. For example, for the topic of benign prostatic hypertrophy, keywords included “difficulty urinating” and “difficulty peeing,” but these keywords could have also been applicable to a topic such as nephrology (unspecified). However, we mitigated these biases by having multiple reviewers with backgrounds in clinical medicine and correlating our topic assignments with words in UpToDate. This ensured that the keywords we chose would lead to the least overlap between topics.</p>
        <p>We also noted that some posts had too much jargon to be easily classifiable into any one topic. In future studies, they should be categorized in the <italic>nonmedical</italic> topic. Some posts, upon manual review, covered multiple health topics. These were the most difficult posts of all. As our algorithm did not have a way of tagging posts with multiple topics, these posts were assigned to only 1 topic. Future refinement of our algorithm could create a tagging system to identify all the major topics in a post, thereby circumventing this issue.</p>
      </sec>
      <sec>
        <title>Future Applications</title>
        <p>Our study provides insights into health discussions on Reddit. Our results may be generalizable to other social media platforms. Facebook groups and Twitter hashtags allow for topic-based forums where people can find community discussion on health issues similarly to subreddits. Previous studies on Facebook and Twitter topic analyses have shown that social media data can be collected to better understand public sentiment on specific health topics [<xref ref-type="bibr" rid="ref13">13</xref>-<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref40">40</xref>]. The topic analysis methods we outlined could be applied to other social media platforms, which may show differences in what topics are discussed. Therefore, future platform-wide studies are needed.</p>
        <p>We found that topics such as STIs and mental health issues are especially prevalent. These are potentially subjects that patients are not often discussing with their health care providers. As previously discussed, people tend to avoid potentially stigmatizing, embarrassing, and uncomfortable conversation topics, and STIs and mental health often entail such feelings. Therefore, our findings reinforce the need for health care systems to have open discussions about these issues. Health care providers establish a framework for these conversations through currently available questionnaires. The Patient Health Questionnaire–9 is a tool that providers can use to assess for depressive symptoms and mood. Asking for a sexual history during patient visits using the 5 P approach (partners, practices, protection from STIs, past history of STIs, and pregnancy) is a systematic way of starting a conversation about a patient’s sexual history and concerns about STIs and pregnancy, topics that were found to be prevalent in our study. In addition, prior work has shown that, when patients seek health information online, the patient-physician relationship can be improved if the physician asks about this information and discusses it with the patient [<xref ref-type="bibr" rid="ref41">41</xref>]. Our study supports that physicians and patients should discuss health information that the patient finds online.</p>
        <p>Health-related discussions on social media and their effects on health policy remain an active area of research. Broadly, health-related discussions on social media have been cited as a potential impactor on disease surveillance and health care policy, practices, and delivery [<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref43">43</xref>]. More recently, the relationship between social media and health policies has been extensively discussed in contexts such as COVID-19 [<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref44">44</xref>] and mental health [<xref ref-type="bibr" rid="ref45">45</xref>-<xref ref-type="bibr" rid="ref49">49</xref>]. Further studies on the impact of social media on health interventions and health outcomes are needed [<xref ref-type="bibr" rid="ref40">40</xref>]. It has been suggested that social media can play a role in health policy beyond increasing awareness of health issues [<xref ref-type="bibr" rid="ref50">50</xref>]. Given the volume and wide variety of health topics discussed on Reddit, future health policies may need to address prevalent beliefs promulgated by health-related discussions on social media sites. Guarding against health misinformation remains an important issue on social media and an active area of study [<xref ref-type="bibr" rid="ref51">51</xref>-<xref ref-type="bibr" rid="ref53">53</xref>]. Therefore, we support policies that encourage informed use of social media and discourage the spread of misinformation. Governance and education about obtaining health information online are crucial.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>To investigate how people use Reddit to talk about seeking medical advice, we conducted a targeted review of posts that talked about “getting tested” and “checked out.” Using an inductive approach to sort these posts into different medical topics, we found that discussion centered on several medical topics. They were further grouped into medical disciplines, and the infectious disease, reproductive, mental health, and endocrine categories had the greatest prevalence.</p>
        <p>Reddit proved to be conducive to gathering information on what people discuss when talking about getting checked or tested. We took a platform-wide approach to this study, aiming to examine posts from a spectrum of subreddits related to health care and medicine. We believe that this approach is unique as it aimed to classify posts into all possible medical disciplines. In addition, based on our review of the literature, this is also one of the few studies conducted on Reddit to understand health discussions. Reddit provides similar advantages to those of other social media platforms in its large user base, wealth of information, and exchange of ideas. However, Reddit is additionally useful for studying communication about health concerns because of several of its features. Subreddits provide structured forums to further sort where discussions are happening on the platform. Several subreddits feature “expert” users, fostering a question-and-answer culture. Most importantly, users may favor Reddit because of its anonymity, which allows them to ask about and discuss potentially embarrassing topics in detail. In this way, Reddit’s unique features prove it to be a viable source of research information that is worth exploring.</p>
        <p>This study was a preliminary examination of the discussions occurring on Reddit. Future work on Reddit would likely take a more focused approach. Further exploration would include answering specific questions about certain topics encountered on Reddit and their prevalence in certain subreddits. Ultimately, these findings could be translated into actionable items, such as improving physician-patient interactions and laboratory management practices. Overall, the culture, structure, and wealth of information on Reddit make it a valuable source for continued investigation of health-related discussions.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Analysis of our Reddit dataset.</p>
        <media xlink:href="formative_v9i1e55309_app1.docx" xlink:title="DOCX File, 156 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">ADHD</term>
          <def>
            <p>attention-deficit/hyperactivity disorder</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">
            <italic>ICD-10</italic>
          </term>
          <def>
            <p>
              <italic>International Classification of Diseases, 10th Revision</italic>
            </p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">STI</term>
          <def>
            <p>sexually transmitted infection</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>The authors would like to thank the Department of Pathology and Laboratory Medicine at the University of Vermont Robert Larner College of Medicine and the RAND Corporation for their support. No generative artificial intelligence was used in the writing of this manuscript.</p>
    </ack>
    <notes>
      <sec>
        <title>Data Availability</title>
        <p>The datasets generated and analyzed during this study are available at the Reddit_public_data repository [<xref ref-type="bibr" rid="ref54">54</xref>].</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="web">
          <source>We Are Social</source>
          <access-date>2020-01-30</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://wearesocial.com/blog/2020/01/digital-2020-3-8-billion-people-use-social-media">https://wearesocial.com/blog/2020/01/digital-2020-3-8-billion-people-use-social-media</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Sohn</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Choi</surname>
              <given-names>SM</given-names>
            </name>
          </person-group>
          <article-title>Cultural difference in motivations for using social network sites: a comparative study of American and Korean college students</article-title>
          <source>Comput Hum Behav</source>
          <year>2011</year>
          <month>1</month>
          <volume>27</volume>
          <issue>1</issue>
          <fpage>365</fpage>
          <lpage>72</lpage>
          <pub-id pub-id-type="doi">10.1016/j.chb.2010.08.015</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Whiting</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Why people use social media: a uses and gratifications approach</article-title>
          <source>Qual Mark Res</source>
          <year>2013</year>
          <month>08</month>
          <day>30</day>
          <volume>16</volume>
          <issue>4</issue>
          <fpage>362</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1108/QMR-06-2013-0041</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Moturu</surname>
              <given-names>ST</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Quantifying utility and trustworthiness for advice shared on online social media</article-title>
          <source>Proceedings of the International Conference on Computational Science and Engineering</source>
          <year>2009</year>
          <conf-name>CSE 2009</conf-name>
          <conf-date>August 29-31, 2009</conf-date>
          <conf-loc>Vancouver, BC</conf-loc>
          <pub-id pub-id-type="doi">10.1109/CSE.2009.461</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Joinson</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Social desirability, anonymity, and internet-based questionnaires</article-title>
          <source>Behav Res Methods Instrum Comput</source>
          <year>1999</year>
          <month>09</month>
          <volume>31</volume>
          <fpage>433</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.3758/BF03200723</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stephens-Davidowitz</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <source>Everybody Lies: Big Data, New Data, and What the Internet Can Tell Us About Who We Really Are</source>
          <year>2017</year>
          <publisher-loc>New York City, NY</publisher-loc>
          <publisher-name>William Morrow</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Berger</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Milkman</surname>
              <given-names>KL</given-names>
            </name>
          </person-group>
          <article-title>What makes online content viral?</article-title>
          <source>J Mark Res</source>
          <year>2012</year>
          <month>04</month>
          <day>01</day>
          <volume>49</volume>
          <issue>2</issue>
          <fpage>192</fpage>
          <lpage>205</lpage>
          <pub-id pub-id-type="doi">10.1509/jmr.10.0353</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shatz</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Fast, free, and targeted: Reddit as a source for recruiting participants online</article-title>
          <source>Soc Sci Comput Rev</source>
          <year>2016</year>
          <month>05</month>
          <day>19</day>
          <volume>35</volume>
          <issue>4</issue>
          <fpage>537</fpage>
          <lpage>49</lpage>
          <pub-id pub-id-type="doi">10.1177/0894439316650163</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kubina</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Varmus</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kubinova</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Use of big data for competitive advantage of company</article-title>
          <source>Procedia Econ Financ</source>
          <year>2015</year>
          <volume>26</volume>
          <fpage>561</fpage>
          <lpage>5</lpage>
          <pub-id pub-id-type="doi">10.1016/s2212-5671(15)00955-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Robards</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Hardy</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bennett</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Robards</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Belonging and neo-tribalism on social media site Reddit</article-title>
          <source>Neo-Tribes</source>
          <year>2018</year>
          <month>09</month>
          <day>29</day>
          <publisher-loc>Cham, Switzerland</publisher-loc>
          <publisher-name>Palgrave Macmillan</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="web">
          <article-title>Reddit statistics for 2024 (Demographics, usage and traffic data)</article-title>
          <source>Foundation Marketing</source>
          <access-date>2022-09-14</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://foundationinc.co/lab/reddit-statistics/">https://foundationinc.co/lab/reddit-statistics/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="web">
          <article-title>Amazon Alexa</article-title>
          <source>Amazon Web Services</source>
          <access-date>2022-09-13</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.alexa.com/siteinfo/reddit.com#card_overlap">https://www.alexa.com/siteinfo/reddit.com#card_overlap</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fan</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Ye</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Social media for opioid addiction epidemiology: automatic detection of opioid addicts from Twitter and case studies</article-title>
          <source>Proceedings of the 2017 ACM on Conference on Information and Knowledge Management</source>
          <year>2017</year>
          <conf-name>CIKM '17</conf-name>
          <conf-date>November 6-10, 2017</conf-date>
          <conf-loc>Singapore, Singapore</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3132847.3132857</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>De la Torre-Díez</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Díaz-Pernas</surname>
              <given-names>FJ</given-names>
            </name>
            <name name-style="western">
              <surname>Antón-Rodríguez</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>A content analysis of chronic diseases social groups on Facebook and Twitter</article-title>
          <source>Telemed J E Health</source>
          <year>2012</year>
          <volume>18</volume>
          <issue>6</issue>
          <fpage>404</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1089/tmj.2011.0227</pub-id>
          <pub-id pub-id-type="medline">22650380</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Prieto</surname>
              <given-names>VM</given-names>
            </name>
            <name name-style="western">
              <surname>Matos</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Álvarez</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cacheda</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Oliveira</surname>
              <given-names>JL</given-names>
            </name>
          </person-group>
          <article-title>Twitter: a good place to detect health conditions</article-title>
          <source>PLoS One</source>
          <year>2014</year>
          <month>01</month>
          <day>29</day>
          <volume>9</volume>
          <issue>1</issue>
          <fpage>e86191</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0086191"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0086191</pub-id>
          <pub-id pub-id-type="medline">24489699</pub-id>
          <pub-id pub-id-type="pii">PONE-D-13-10567</pub-id>
          <pub-id pub-id-type="pmcid">PMC3906034</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ren</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Depression detection on Reddit with an emotion-based attention network: algorithm development and validation</article-title>
          <source>JMIR Med Inform</source>
          <year>2021</year>
          <month>07</month>
          <day>16</day>
          <volume>9</volume>
          <issue>7</issue>
          <fpage>e28754</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2021/7/e28754/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/28754</pub-id>
          <pub-id pub-id-type="medline">34269683</pub-id>
          <pub-id pub-id-type="pii">v9i7e28754</pub-id>
          <pub-id pub-id-type="pmcid">PMC8325087</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yao</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Rashidian</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Dong</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Duanmu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Rosenthal</surname>
              <given-names>RN</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Detection of suicidality among opioid users on Reddit: machine learning-based approach</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <month>11</month>
          <day>27</day>
          <volume>22</volume>
          <issue>11</issue>
          <fpage>e15293</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/11/e15293/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/15293</pub-id>
          <pub-id pub-id-type="medline">33245287</pub-id>
          <pub-id pub-id-type="pii">v22i11e15293</pub-id>
          <pub-id pub-id-type="pmcid">PMC7732714</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yin</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Understanding weight loss via online discussions: content analysis of Reddit posts using topic modeling and word clustering techniques</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <month>06</month>
          <day>08</day>
          <volume>22</volume>
          <issue>6</issue>
          <fpage>e13745</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/6/e13745/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/13745</pub-id>
          <pub-id pub-id-type="medline">32510460</pub-id>
          <pub-id pub-id-type="pii">v22i6e13745</pub-id>
          <pub-id pub-id-type="pmcid">PMC7308899</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Eichstaedt</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Merchant</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Ungar</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Crutchley</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Preoţiuc-Pietro</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Asch</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Schwartz</surname>
              <given-names>HA</given-names>
            </name>
          </person-group>
          <article-title>Facebook language predicts depression in medical records</article-title>
          <source>Proc Natl Acad Sci U S A</source>
          <year>2018</year>
          <month>10</month>
          <day>30</day>
          <volume>115</volume>
          <issue>44</issue>
          <fpage>11203</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.pnas.org/doi/abs/10.1073/pnas.1802331115?url_ver=Z39.88-2003&amp;rfr_id=ori:rid:crossref.org&amp;rfr_dat=cr_pub%20%200pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1073/pnas.1802331115</pub-id>
          <pub-id pub-id-type="medline">30322910</pub-id>
          <pub-id pub-id-type="pii">1802331115</pub-id>
          <pub-id pub-id-type="pmcid">PMC6217418</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Merchant</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Asch</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Crutchley</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Ungar</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Guntuku</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Eichstaedt</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Hill</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Padrez</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Schwartz</surname>
              <given-names>HA</given-names>
            </name>
          </person-group>
          <article-title>Evaluating the predictability of medical conditions from social media posts</article-title>
          <source>PLoS One</source>
          <year>2019</year>
          <month>06</month>
          <day>17</day>
          <volume>14</volume>
          <issue>6</issue>
          <fpage>e0215476</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0215476"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0215476</pub-id>
          <pub-id pub-id-type="medline">31206534</pub-id>
          <pub-id pub-id-type="pii">PONE-D-18-34864</pub-id>
          <pub-id pub-id-type="pmcid">PMC6576767</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="web">
          <article-title>Ways to become a moderator</article-title>
          <source>Reddit</source>
          <access-date>2023-02-28</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mods.reddithelp.com/hc/en-us/articles/360001745332-Ways-to-become-a-moderator">https://mods.reddithelp.com/hc/en-us/articles/360001745332-Ways-to-become-a-moderator</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Park</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Conway</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>AT</given-names>
            </name>
          </person-group>
          <article-title>Examining thematic similarity, difference, and membership in three online mental health communities from Reddit: a text mining and visualization approach</article-title>
          <source>Comput Human Behav</source>
          <year>2018</year>
          <month>01</month>
          <volume>78</volume>
          <fpage>98</fpage>
          <lpage>112</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/29456286"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.chb.2017.09.001</pub-id>
          <pub-id pub-id-type="medline">29456286</pub-id>
          <pub-id pub-id-type="pmcid">PMC5810583</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="web">
          <article-title>reddit - search results - PubMed</article-title>
          <source>PubMed</source>
          <access-date>2022-09-14</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://pubmed.ncbi.nlm.nih.gov/?term=reddit&amp;sort_order=asc&amp;size=200">https://pubmed.ncbi.nlm.nih.gov/?term=reddit&amp;sort_order=asc&amp;size=200</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="web">
          <article-title>The ICD-10 classification of mental and behavioural disorders: diagnostic criteria for research</article-title>
          <source>World Health Organization</source>
          <access-date>2022-12-03</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://iris.who.int/handle/10665/37108">https://iris.who.int/handle/10665/37108</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="web">
          <article-title>UpToDate: trusted, evidence-based solutions for modern healthcare</article-title>
          <source>Wolters Kluwer</source>
          <access-date>2023-07-15</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.wolterskluwer.com/en/solutions/uptodate">https://www.wolterskluwer.com/en/solutions/uptodate</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wickham</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Averick</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bryan</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>McGowan</surname>
              <given-names>LD</given-names>
            </name>
            <name name-style="western">
              <surname>François</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Grolemund</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Hayes</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Henry</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Hester</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kuhn</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pedersen</surname>
              <given-names>TL</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Bache</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Müller</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Ooms</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Robinson</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Seidel</surname>
              <given-names>DP</given-names>
            </name>
            <name name-style="western">
              <surname>Spinu</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Takahashi</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Vaughan</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Wilke</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Woo</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Yutani</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Welcome to the Tidyverse</article-title>
          <source>J Open Source Softw</source>
          <year>2019</year>
          <month>11</month>
          <day>21</day>
          <volume>4</volume>
          <issue>43</issue>
          <fpage>1686</fpage>
          <pub-id pub-id-type="doi">10.21105/joss.01686</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Foufi</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Timakum</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Gaudet-Blavignac</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lovis</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Song</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Mining of textual health information from Reddit: analysis of chronic diseases with extracted entities and their relations</article-title>
          <source>J Med Internet Res</source>
          <year>2019</year>
          <month>06</month>
          <day>13</day>
          <volume>21</volume>
          <issue>6</issue>
          <fpage>e12876</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2019/6/e12876/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/12876</pub-id>
          <pub-id pub-id-type="medline">31199327</pub-id>
          <pub-id pub-id-type="pii">v21i6e12876</pub-id>
          <pub-id pub-id-type="pmcid">PMC6595941</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nowak</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Parker</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Gidengil</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Matthews</surname>
              <given-names>LJ</given-names>
            </name>
          </person-group>
          <article-title>Comparing covariation among vaccine hesitancy and broader beliefs within Twitter and survey data</article-title>
          <source>PLoS One</source>
          <year>2020</year>
          <month>10</month>
          <day>08</day>
          <volume>15</volume>
          <issue>10</issue>
          <fpage>e0239826</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0239826"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0239826</pub-id>
          <pub-id pub-id-type="medline">33031405</pub-id>
          <pub-id pub-id-type="pii">PONE-D-20-09839</pub-id>
          <pub-id pub-id-type="pmcid">PMC7544030</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Eldh</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Årestedt</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Berterö</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Quotations in qualitative studies: reflections on constituents, custom, and purpose</article-title>
          <source>Int J Qual Methods</source>
          <year>2020</year>
          <month>11</month>
          <day>02</day>
          <volume>19</volume>
          <fpage>1</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.1177/1609406920969268</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Patton</surname>
              <given-names>MQ</given-names>
            </name>
          </person-group>
          <source>Qualitative Research &amp; Evaluation Methods: Integrating Theory and Practice</source>
          <year>2014</year>
          <publisher-loc>Thousand Oaks, CA</publisher-loc>
          <publisher-name>SAGE Publications</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Roman</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Rodriguez-Arrastia</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Molina-Torres</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Márquez-Hernández</surname>
              <given-names>VV</given-names>
            </name>
            <name name-style="western">
              <surname>Gutiérrez-Puertas</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ropero-Padilla</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>The escape room as evaluation method: a qualitative study of nursing students' experiences</article-title>
          <source>Med Teach</source>
          <year>2020</year>
          <month>04</month>
          <volume>42</volume>
          <issue>4</issue>
          <fpage>403</fpage>
          <lpage>10</lpage>
          <pub-id pub-id-type="doi">10.1080/0142159X.2019.1687865</pub-id>
          <pub-id pub-id-type="medline">31738615</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Du</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Moskowitz</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Lucioni</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kobashi</surname>
              <given-names>KC</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>UJ</given-names>
            </name>
          </person-group>
          <article-title>I leaked, then I Reddit: experiences and insight shared on urinary incontinence by Reddit users</article-title>
          <source>Int Urogynecol J</source>
          <year>2020</year>
          <month>02</month>
          <volume>31</volume>
          <issue>2</issue>
          <fpage>243</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1007/s00192-019-04165-8</pub-id>
          <pub-id pub-id-type="medline">31832718</pub-id>
          <pub-id pub-id-type="pii">10.1007/s00192-019-04165-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stuart</surname>
              <given-names>GS</given-names>
            </name>
            <name name-style="western">
              <surname>Grimes</surname>
              <given-names>DA</given-names>
            </name>
          </person-group>
          <article-title>Social desirability bias in family planning studies: a neglected problem</article-title>
          <source>Contraception</source>
          <year>2009</year>
          <month>08</month>
          <volume>80</volume>
          <issue>2</issue>
          <fpage>108</fpage>
          <lpage>12</lpage>
          <pub-id pub-id-type="doi">10.1016/j.contraception.2009.02.009</pub-id>
          <pub-id pub-id-type="medline">19631784</pub-id>
          <pub-id pub-id-type="pii">S0010-7824(09)00072-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Morisky</surname>
              <given-names>DE</given-names>
            </name>
            <name name-style="western">
              <surname>Ang</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sneed</surname>
              <given-names>CD</given-names>
            </name>
          </person-group>
          <article-title>Validating the effects of social desirability on self-reported condom use behavior among commercial sex workers</article-title>
          <source>AIDS Educ Prev</source>
          <year>2002</year>
          <month>10</month>
          <volume>14</volume>
          <issue>5</issue>
          <fpage>351</fpage>
          <lpage>60</lpage>
          <pub-id pub-id-type="doi">10.1521/aeap.14.6.351.24078</pub-id>
          <pub-id pub-id-type="medline">12413181</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Davis</surname>
              <given-names>CG</given-names>
            </name>
            <name name-style="western">
              <surname>Thake</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Vilhena</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Social desirability biases in self-reported alcohol consumption and harms</article-title>
          <source>Addict Behav</source>
          <year>2010</year>
          <month>04</month>
          <volume>35</volume>
          <issue>4</issue>
          <fpage>302</fpage>
          <lpage>11</lpage>
          <pub-id pub-id-type="doi">10.1016/j.addbeh.2009.11.001</pub-id>
          <pub-id pub-id-type="medline">19932936</pub-id>
          <pub-id pub-id-type="pii">S0306-4603(09)00307-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Crutzen</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Peters</surname>
              <given-names>GJ</given-names>
            </name>
            <name name-style="western">
              <surname>Portugal</surname>
              <given-names>SD</given-names>
            </name>
            <name name-style="western">
              <surname>Fisser</surname>
              <given-names>EM</given-names>
            </name>
            <name name-style="western">
              <surname>Grolleman</surname>
              <given-names>JJ</given-names>
            </name>
          </person-group>
          <article-title>An artificially intelligent chat agent that answers adolescents' questions related to sex, drugs, and alcohol: an exploratory study</article-title>
          <source>J Adolesc Health</source>
          <year>2011</year>
          <month>05</month>
          <volume>48</volume>
          <issue>5</issue>
          <fpage>514</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jadohealth.2010.09.002</pub-id>
          <pub-id pub-id-type="medline">21501812</pub-id>
          <pub-id pub-id-type="pii">S1054-139X(10)00430-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Koo</surname>
              <given-names>PK</given-names>
            </name>
            <name name-style="western">
              <surname>Majdandzic</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ploenzke</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Anand</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Paul</surname>
              <given-names>SB</given-names>
            </name>
          </person-group>
          <article-title>Global importance analysis: an interpretability method to quantify importance of genomic features in deep neural networks</article-title>
          <source>PLoS Comput Biol</source>
          <year>2021</year>
          <month>05</month>
          <day>13</day>
          <volume>17</volume>
          <issue>5</issue>
          <fpage>e1008925</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pcbi.1008925"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pcbi.1008925</pub-id>
          <pub-id pub-id-type="medline">33983921</pub-id>
          <pub-id pub-id-type="pii">PCOMPBIOL-D-20-01489</pub-id>
          <pub-id pub-id-type="pmcid">PMC8118286</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sugawara</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Narimatsu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Hozawa</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Shao</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Otani</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Fukao</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Cancer patients on Twitter: a novel patient community on social media</article-title>
          <source>BMC Res Notes</source>
          <year>2012</year>
          <month>12</month>
          <day>27</day>
          <volume>5</volume>
          <fpage>699</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcresnotes.biomedcentral.com/articles/10.1186/1756-0500-5-699"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1756-0500-5-699</pub-id>
          <pub-id pub-id-type="medline">23270426</pub-id>
          <pub-id pub-id-type="pii">1756-0500-5-699</pub-id>
          <pub-id pub-id-type="pmcid">PMC3599295</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Monselise</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>CH</given-names>
            </name>
            <name name-style="western">
              <surname>Ferreira</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>CC</given-names>
            </name>
          </person-group>
          <article-title>Topics and sentiments of public concerns regarding COVID-19 vaccines: social media trend analysis</article-title>
          <source>J Med Internet Res</source>
          <year>2021</year>
          <month>10</month>
          <day>21</day>
          <volume>23</volume>
          <issue>10</issue>
          <fpage>e30765</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2021/10/e30765/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/30765</pub-id>
          <pub-id pub-id-type="medline">34581682</pub-id>
          <pub-id pub-id-type="pii">v23i10e30765</pub-id>
          <pub-id pub-id-type="pmcid">PMC8534488</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Valdez</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Ten Thij</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bathina</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Rutter</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Bollen</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Social media insights into US mental health during the COVID-19 pandemic: longitudinal analysis of Twitter data</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <month>12</month>
          <day>14</day>
          <volume>22</volume>
          <issue>12</issue>
          <fpage>e21418</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/12/e21418/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/21418</pub-id>
          <pub-id pub-id-type="medline">33284783</pub-id>
          <pub-id pub-id-type="pii">v22i12e21418</pub-id>
          <pub-id pub-id-type="pmcid">PMC7744146</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tan</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Goonawardene</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Internet health information seeking and the patient-physician relationship: a systematic review</article-title>
          <source>J Med Internet Res</source>
          <year>2017</year>
          <month>01</month>
          <day>19</day>
          <volume>19</volume>
          <issue>1</issue>
          <fpage>e9</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2017/1/e9/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.5729</pub-id>
          <pub-id pub-id-type="medline">28104579</pub-id>
          <pub-id pub-id-type="pii">v19i1e9</pub-id>
          <pub-id pub-id-type="pmcid">PMC5290294</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Social media use for health purposes: systematic review</article-title>
          <source>J Med Internet Res</source>
          <year>2021</year>
          <month>05</month>
          <day>12</day>
          <volume>23</volume>
          <issue>5</issue>
          <fpage>e17917</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2021/5/e17917/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/17917</pub-id>
          <pub-id pub-id-type="medline">33978589</pub-id>
          <pub-id pub-id-type="pii">v23i5e17917</pub-id>
          <pub-id pub-id-type="pmcid">PMC8156131</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Patrick</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Venkatesh</surname>
              <given-names>RD</given-names>
            </name>
            <name name-style="western">
              <surname>Stukus</surname>
              <given-names>DR</given-names>
            </name>
          </person-group>
          <article-title>Social media and its impact on health care</article-title>
          <source>Ann Allergy Asthma Immunol</source>
          <year>2022</year>
          <month>02</month>
          <volume>128</volume>
          <issue>2</issue>
          <fpage>139</fpage>
          <lpage>45</lpage>
          <pub-id pub-id-type="doi">10.1016/j.anai.2021.09.014</pub-id>
          <pub-id pub-id-type="medline">34555532</pub-id>
          <pub-id pub-id-type="pii">S1081-1206(21)01053-X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>CY</given-names>
            </name>
            <name name-style="western">
              <surname>Broström</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Griffiths</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Pakpour</surname>
              <given-names>AH</given-names>
            </name>
          </person-group>
          <article-title>Investigating mediated effects of fear of COVID-19 and COVID-19 misunderstanding in the association between problematic social media use, psychological distress, and insomnia</article-title>
          <source>Internet Interv</source>
          <year>2020</year>
          <month>09</month>
          <volume>21</volume>
          <fpage>100345</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2214-7829(20)30111-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.invent.2020.100345</pub-id>
          <pub-id pub-id-type="medline">32868992</pub-id>
          <pub-id pub-id-type="pii">S2214-7829(20)30111-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC7449889</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Latha</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Meena</surname>
              <given-names>KS</given-names>
            </name>
            <name name-style="western">
              <surname>Pravitha</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Dasgupta</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chaturvedi</surname>
              <given-names>SK</given-names>
            </name>
          </person-group>
          <article-title>Effective use of social media platforms for promotion of mental health awareness</article-title>
          <source>J Educ Health Promot</source>
          <year>2020</year>
          <month>05</month>
          <day>28</day>
          <volume>9</volume>
          <fpage>124</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32642480"/>
          </comment>
          <pub-id pub-id-type="doi">10.4103/jehp.jehp_90_20</pub-id>
          <pub-id pub-id-type="medline">32642480</pub-id>
          <pub-id pub-id-type="pii">JEHP-9-124</pub-id>
          <pub-id pub-id-type="pmcid">PMC7325786</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mazuz</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Yom-Tov</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Analyzing trends of loneliness through large-scale analysis of social media postings: observational study</article-title>
          <source>JMIR Ment Health</source>
          <year>2020</year>
          <month>04</month>
          <day>20</day>
          <volume>7</volume>
          <issue>4</issue>
          <fpage>e17188</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mental.jmir.org/2020/4/e17188/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/17188</pub-id>
          <pub-id pub-id-type="medline">32310141</pub-id>
          <pub-id pub-id-type="pii">v7i4e17188</pub-id>
          <pub-id pub-id-type="pmcid">PMC7199140</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Onyeaka</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Firth</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ajayi</surname>
              <given-names>KV</given-names>
            </name>
            <name name-style="western">
              <surname>Muoghalu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Holmes</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Nkemjika</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Adeolu</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Anugwom</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Eseaton</surname>
              <given-names>PO</given-names>
            </name>
            <name name-style="western">
              <surname>Onyeaka</surname>
              <given-names>NC</given-names>
            </name>
            <name name-style="western">
              <surname>Huffman</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Torous</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Association between social media use and health promotion among individuals with depression and anxiety: insights from the 2017–2020 Health Information National Trends Survey</article-title>
          <source>J Mood Anxiety Disord</source>
          <year>2023</year>
          <month>06</month>
          <volume>1</volume>
          <fpage>100006</fpage>
          <pub-id pub-id-type="doi">10.1016/j.xjmad.2023.100006</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Plackett</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Blyth</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Schartau</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>The impact of social media use interventions on mental well-being: systematic review</article-title>
          <source>J Med Internet Res</source>
          <year>2023</year>
          <month>08</month>
          <day>11</day>
          <volume>25</volume>
          <fpage>e44922</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2023/1/e44922/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/44922</pub-id>
          <pub-id pub-id-type="medline">37565693</pub-id>
          <pub-id pub-id-type="pii">v25i1e44922</pub-id>
          <pub-id pub-id-type="pmcid">PMC10457695</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vandenbosch</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Fardouly</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tiggemann</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Social media and body image: recent trends and future directions</article-title>
          <source>Curr Opin Psychol</source>
          <year>2022</year>
          <month>06</month>
          <volume>45</volume>
          <fpage>101289</fpage>
          <pub-id pub-id-type="doi">10.1016/j.copsyc.2021.12.002</pub-id>
          <pub-id pub-id-type="medline">35030460</pub-id>
          <pub-id pub-id-type="pii">S2352-250X(21)00241-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ghahramani</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>de Courten</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Prokofieva</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>"The potential of social media in health promotion beyond creating awareness: an integrative review"</article-title>
          <source>BMC Public Health</source>
          <year>2022</year>
          <month>12</month>
          <day>21</day>
          <volume>22</volume>
          <issue>1</issue>
          <fpage>2402</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcpublichealth.biomedcentral.com/articles/10.1186/s12889-022-14885-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12889-022-14885-0</pub-id>
          <pub-id pub-id-type="medline">36544121</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12889-022-14885-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC9770563</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Allcott</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Boxell</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Conway</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Gentzkow</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Thaler</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Polarization and public health: partisan differences in social distancing during the coronavirus pandemic</article-title>
          <source>J Public Econ</source>
          <year>2020</year>
          <month>11</month>
          <volume>191</volume>
          <fpage>104254</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32836504"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jpubeco.2020.104254</pub-id>
          <pub-id pub-id-type="medline">32836504</pub-id>
          <pub-id pub-id-type="pii">104254</pub-id>
          <pub-id pub-id-type="pmcid">PMC7409721</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Suarez-Lledo</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Alvarez-Galvez</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Prevalence of health misinformation on social media: systematic review</article-title>
          <source>J Med Internet Res</source>
          <year>2021</year>
          <month>01</month>
          <day>20</day>
          <volume>23</volume>
          <issue>1</issue>
          <fpage>e17187</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2021/1/e17187/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/17187</pub-id>
          <pub-id pub-id-type="medline">33470931</pub-id>
          <pub-id pub-id-type="pii">v23i1e17187</pub-id>
          <pub-id pub-id-type="pmcid">PMC7857950</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Togher</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Health misinformation on social media and adolescent health</article-title>
          <source>JAMA Pediatr</source>
          <year>2024</year>
          <month>02</month>
          <day>01</day>
          <volume>178</volume>
          <issue>2</issue>
          <fpage>109</fpage>
          <lpage>110</lpage>
          <pub-id pub-id-type="doi">10.1001/jamapediatrics.2023.5282</pub-id>
          <pub-id pub-id-type="medline">38079180</pub-id>
          <pub-id pub-id-type="pii">2812569</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="web">
          <article-title>Reddit_data_public</article-title>
          <source>Google Drive</source>
          <access-date>2025-01-16</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://drive.google.com/drive/folders/1gkyl8COxEeumbMZP-CFa2cbBnV1pNGt1">https://drive.google.com/drive/folders/1gkyl8COxEeumbMZP-CFa2cbBnV1pNGt1</ext-link>
          </comment>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
