<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JFR</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Form Res</journal-id>
      <journal-title>JMIR Formative Research</journal-title>
      <issn pub-type="epub">2561-326X</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v8i1e49031</article-id>
      <article-id pub-id-type="pmid">38265858</article-id>
      <article-id pub-id-type="doi">10.2196/49031</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Use of Machine Learning Tools in Evidence Synthesis of Tobacco Use Among Sexual and Gender Diverse Populations: Algorithm Development and Validation</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Mavragani</surname>
            <given-names>Amaryllis</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Chavez</surname>
            <given-names>Alexis</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Matsuda</surname>
            <given-names>Shinichi</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes" equal-contrib="yes">
          <name name-style="western">
            <surname>Ma</surname>
            <given-names>Shaoying</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Center for Tobacco Research</institution>
            <institution>The Ohio State University Comprehensive Cancer Center</institution>
            <addr-line>3650 Olentangy River Road</addr-line>
            <addr-line>1st Floor, Suite 110</addr-line>
            <addr-line>Columbus, OH, 43214</addr-line>
            <country>United States</country>
            <phone>1 6148976063</phone>
            <email>shaoying.ma@osumc.edu</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6086-0622</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Jiang</surname>
            <given-names>Shuning</given-names>
          </name>
          <degrees>BS</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6706-2818</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>Olivia</given-names>
          </name>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0003-5690-9539</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>Xuanzhi</given-names>
          </name>
          <degrees>BS</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0001-0854-8746</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Fu</surname>
            <given-names>Yu</given-names>
          </name>
          <degrees>BS</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8477-8888</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>Yusen</given-names>
          </name>
          <degrees>BS</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0009-6001-6809</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Kaareen</surname>
            <given-names>Aadeeba</given-names>
          </name>
          <degrees>BSocSci</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0002-3999-0294</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Ling</surname>
            <given-names>Meng</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6597-5448</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author">
          <name name-style="western">
            <surname>Chen</surname>
            <given-names>Jian</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-1599-0831</ext-link>
        </contrib>
        <contrib id="contrib10" contrib-type="author">
          <name name-style="western">
            <surname>Shang</surname>
            <given-names>Ce</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-8838-4250</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Center for Tobacco Research</institution>
        <institution>The Ohio State University Comprehensive Cancer Center</institution>
        <addr-line>Columbus, OH</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Computer Science and Engineering</institution>
        <institution>The Ohio State University</institution>
        <addr-line>Columbus, OH</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Shaoying Ma <email>shaoying.ma@osumc.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2024</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>24</day>
        <month>1</month>
        <year>2024</year>
      </pub-date>
      <volume>8</volume>
      <elocation-id>e49031</elocation-id>
      <history>
        <date date-type="received">
          <day>15</day>
          <month>5</month>
          <year>2023</year>
        </date>
        <date date-type="rev-request">
          <day>20</day>
          <month>8</month>
          <year>2023</year>
        </date>
        <date date-type="rev-recd">
          <day>6</day>
          <month>12</month>
          <year>2023</year>
        </date>
        <date date-type="accepted">
          <day>29</day>
          <month>12</month>
          <year>2023</year>
        </date>
      </history>
      <copyright-statement>©Shaoying Ma, Shuning Jiang, Olivia Yang, Xuanzhi Zhang, Yu Fu, Yusen Zhang, Aadeeba Kaareen, Meng Ling, Jian Chen, Ce Shang. Originally published in JMIR Formative Research (https://formative.jmir.org), 24.01.2024.</copyright-statement>
      <copyright-year>2024</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Formative Research, is properly cited. The complete bibliographic information, a link to the original publication on https://formative.jmir.org, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://formative.jmir.org/2024/1/e49031" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>From 2016 to 2021, the volume of peer-reviewed publications related to tobacco has experienced a significant increase. This presents a considerable challenge in efficiently summarizing, synthesizing, and disseminating research findings, especially when it comes to addressing specific target populations, such as the LGBTQ+ (lesbian, gay, bisexual, transgender, queer, intersex, asexual, Two Spirit, and other persons who identify as part of this community) populations.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>In order to expedite evidence synthesis and research gap discoveries, this pilot study has the following three aims: (1) to compile a specialized semantic database for tobacco policy research to extract information from journal article abstracts, (2) to develop natural language processing (NLP) algorithms that comprehend the literature on nicotine and tobacco product use among sexual and gender diverse populations, and (3) to compare the discoveries of the NLP algorithms with an ongoing systematic review of tobacco policy research among LGBTQ+ populations.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We built a tobacco research domain–specific semantic database using data from 2993 paper abstracts from 4 leading tobacco-specific journals, with enrichment from other publicly available sources. We then trained an NLP model to extract named entities after learning patterns and relationships between words and their context in text, which further enriched the semantic database. Using this iterative process, we extracted and assessed studies relevant to LGBTQ+ tobacco control issues, further comparing our findings with an ongoing systematic review that also focuses on evidence synthesis for this demographic group.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>In total, 33 studies were identified as relevant to sexual and gender diverse individuals’ nicotine and tobacco product use. Consistent with the ongoing systematic review, the NLP results showed that there is a scarcity of studies assessing policy impact on this demographic using causal inference methods. In addition, the literature is dominated by US data. We found that the product drawing the most attention in the body of existing research is cigarettes or cigarette smoking and that the number of studies of various age groups is almost evenly distributed between youth or young adults and adults, consistent with the research needs identified by the US health agencies.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Our pilot study serves as a compelling demonstration of the capabilities of NLP tools in expediting the processes of evidence synthesis and the identification of research gaps. While future research is needed to statistically test the NLP tool’s performance, there is potential for NLP tools to fundamentally transform the approach to evidence synthesis.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>machine learning</kwd>
        <kwd>natural language processing</kwd>
        <kwd>tobacco control</kwd>
        <kwd>sexual and gender diverse populations</kwd>
        <kwd>lesbian</kwd>
        <kwd>gay</kwd>
        <kwd>bisexual</kwd>
        <kwd>transgender</kwd>
        <kwd>queer</kwd>
        <kwd>LGBTQ+</kwd>
        <kwd>evidence synthesis</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>The use of nicotine or tobacco products is a leading preventable cause of cancer, heart diseases, and lung diseases in the United States [<xref ref-type="bibr" rid="ref1">1</xref>], with cigarette smoking alone responsible for the death of half a million Americans each year [<xref ref-type="bibr" rid="ref2">2</xref>]. Notably, sexual and gender diverse individuals, often referred to as the LGBTQ+ (lesbian, gay, bisexual, transgender, queer, intersex, asexual, Two Spirit, and other persons who identify as part of this community) populations, are particularly vulnerable to nicotine and tobacco product use [<xref ref-type="bibr" rid="ref3">3</xref>]. Both the National Cancer Institute and the Centers for Disease Control and Prevention have recognized the LGBTQ+ populations as a critical target in their efforts to combat tobacco use disparities [<xref ref-type="bibr" rid="ref4">4</xref>-<xref ref-type="bibr" rid="ref10">10</xref>].</p>
      <p>In response to the pressing need for tobacco control and the rapidly evolving landscape of the tobacco market, the National Institutes of Health (NIH) and other health foundations, including the American Cancer Society, have made substantial investments in tobacco control research and tobacco regulatory science [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref12">12</xref>]. According to our calculations using data from the NIH era reporter, funding for tobacco research has shown a remarkable increase, growing from US $7.7 billion in 2016 to US $11.2 billion in 2021 (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> [<xref ref-type="bibr" rid="ref13">13</xref>]). Consequently, the volume of peer-reviewed publications related to tobacco has experienced a significant increase. This presents a considerable challenge in efficiently summarizing, synthesizing, and disseminating research findings, especially when it comes to addressing specific target populations, such as the LGBTQ+ populations.</p>
      <p>One promising pathway to rapidly assessing the expanding body of literature is the use of natural language processing (NLP) models. NLP is dedicated to deciphering and comprehending how computers interpret human language, equipping them to analyze extensive data sets of natural language [<xref ref-type="bibr" rid="ref14">14</xref>-<xref ref-type="bibr" rid="ref16">16</xref>]. While NLP tools have garnered considerable recognition in biomedical research [<xref ref-type="bibr" rid="ref4">4</xref>-<xref ref-type="bibr" rid="ref10">10</xref>], aiding in tasks such as disease surveillance (eg, COVID-19) and diagnosing using medical records [<xref ref-type="bibr" rid="ref17">17</xref>-<xref ref-type="bibr" rid="ref23">23</xref>], their potential to expedite near real-time synthesis of evidence in tobacco control research remains untapped [<xref ref-type="bibr" rid="ref24">24</xref>].</p>
      <p>Another gap in existing NLP tools is the lack of applications in synthesizing social science research and modeling. A noteworthy example in the domain of tobacco research is the evaluation of the effectiveness of tobacco control policies, which are often assessed using complex statistical modeling and large-scale survey data. These methods demand a specialized semantic database for labeling studies and interpreting results. However, to the best of our knowledge, such a semantic database has not been developed yet. Considering that policy interventions at federal, state, and local levels are designed to reach a large number of populations, the lack of a database to facilitate NLP applications may significantly undermine evidence synthesis and thereby the timely adoption of effective policies [<xref ref-type="bibr" rid="ref25">25</xref>].</p>
      <p>Furthermore, in light of the calls from entities such as the NIH and other health agencies to address tobacco use disparities within priority populations, including LGBTQ+ populations, the development of NLP tools to aid in the discovery of effective policies tailored to these special populations remains uncharted territory [<xref ref-type="bibr" rid="ref26">26</xref>-<xref ref-type="bibr" rid="ref31">31</xref>]. There is an urgent demand for the development of NLP tools (eg, semantic database, NLP algorithms) in tobacco research that have the abilities to synthesize evidence in social science and assist in research gap discovery for priority populations.</p>
      <p>In this pilot study, we aimed to achieve the following goals to address the identified research and application gaps: (1) compile a specialized semantic database for tobacco policy research to extract information from journal article abstracts, (2) develop NLP algorithms that comprehend the literature on nicotine and tobacco product use among sexual and gender diverse populations, and (3) compare the discoveries of the NLP algorithms with an ongoing systematic review of tobacco policy research among LGBTQ+ populations [<xref ref-type="bibr" rid="ref32">32</xref>]. While this pilot study does not fully address the gaps by developing a comprehensive evidence synthesis or discovery tool for tobacco research, the outcomes may pave the road for future tools that can achieve this goal. Our vision is that NLP tools may be able to assist academic scholars and policy makers in prescribing public health policies, such as tobacco control policies, and addressing public health needs, such as reducing health disparities.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Development of a Tobacco Research Domain–Specific Semantic Database</title>
        <sec>
          <title>Overview</title>
          <p>To generate a tobacco research domain-specific semantic database, we used an iterative process that combines expert opinions and the reading of tobacco research papers in 4 leading tobacco journals (<italic>Tobacco Control</italic>, <italic>Nicotine and Tobacco Research</italic>, <italic>Tobacco Induced Diseases</italic>, and <italic>Tobacco Prevention and Cessation</italic>). The main categories of keywords were as follows: (1) tobacco use behaviors, prevalence, and outcomes; (2) population characteristics; (3) geographic locations; (4) method and inference; (5) policy; (6) tobacco products; (7) relation statement; and (8) tobacco characteristics. Under each main category, there were one or more subcategories, and each subcategory contained a list of named entities. <xref ref-type="table" rid="table1">Table 1</xref> presents the categories of named entities in a domain-specific semantic database that were used for training and improving a language model for tobacco research on sexual and gender diverse populations. These categories are based on journal articles’ keywords, further guided by existing literature on how to use NLP methods to synthesize public health evidence [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref33">33</xref>]. These categories are important components of a study, encompassing measures, methods, results, conclusions, and hypothesis testing.</p>
          <table-wrap position="float" id="table1">
            <label>Table 1</label>
            <caption>
              <p>Main categories and subcategories of named entities.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="300"/>
              <col width="700"/>
              <thead>
                <tr valign="top">
                  <td>Main categories</td>
                  <td>Subcategories</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td>Tobacco use behavioral outcomes</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>Tobacco cessation</p>
                      </list-item>
                      <list-item>
                        <p>Exposure to tobacco-related or antitobacco content, or exposure to secondhand or thirdhand smoking</p>
                      </list-item>
                      <list-item>
                        <p>Health and disease</p>
                      </list-item>
                      <list-item>
                        <p>Perception and belief</p>
                      </list-item>
                      <list-item>
                        <p>Tobacco use prevalence</p>
                      </list-item>
                      <list-item>
                        <p>Time period</p>
                      </list-item>
                    </list>
                  </td>
                </tr>
                <tr valign="top">
                  <td>Population characteristics</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>Age groups</p>
                      </list-item>
                      <list-item>
                        <p>Sex</p>
                      </list-item>
                      <list-item>
                        <p>Sexual and gender diverse populations</p>
                      </list-item>
                      <list-item>
                        <p>Racial and ethnic minoritized groups</p>
                      </list-item>
                      <list-item>
                        <p>Socioeconomic status</p>
                      </list-item>
                    </list>
                  </td>
                </tr>
                <tr valign="top">
                  <td>Geographic locations</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>Countries, states, provinces, or cities</p>
                      </list-item>
                    </list>
                  </td>
                </tr>
                <tr valign="top">
                  <td>Method and inference</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>Data</p>
                      </list-item>
                      <list-item>
                        <p>Methodology</p>
                      </list-item>
                      <list-item>
                        <p>Statistics</p>
                      </list-item>
                    </list>
                  </td>
                </tr>
                <tr valign="top">
                  <td>Policy</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>Marketing</p>
                      </list-item>
                      <list-item>
                        <p>Law, policy, and regulation</p>
                      </list-item>
                      <list-item>
                        <p>Regulation body</p>
                      </list-item>
                      <list-item>
                        <p>Treatment</p>
                      </list-item>
                    </list>
                  </td>
                </tr>
                <tr valign="top">
                  <td>Tobacco products</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>Combustible tobacco products</p>
                      </list-item>
                      <list-item>
                        <p>Noncombustible tobacco products</p>
                      </list-item>
                    </list>
                  </td>
                </tr>
                <tr valign="top">
                  <td>Relation statement</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>Relation terms</p>
                      </list-item>
                    </list>
                  </td>
                </tr>
                <tr valign="top">
                  <td>Tobacco characteristics</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>Chemical</p>
                      </list-item>
                      <list-item>
                        <p>Flavor</p>
                      </list-item>
                    </list>
                  </td>
                </tr>
              </tbody>
            </table>
          </table-wrap>
        </sec>
        <sec>
          <title>Journal Selection</title>
          <p>We chose 4 peer-reviewed tobacco-specific multidisciplinary journals, namely, <italic>Tobacco Control</italic>, <italic>Nicotine and Tobacco Research</italic>, <italic>Tobacco Induced Diseases</italic>, and <italic>Tobacco Prevention and Cessation</italic>, to extract articles and compile keywords at the initial stage. The first 2 are among the journals that have the highest impact factors in addiction research; in 2022, <italic>Tobacco Control</italic> had an impact factor of 5.2 and a 5-year impact factor of 5.7 [<xref ref-type="bibr" rid="ref34">34</xref>], and <italic>Nicotine and Tobacco Research</italic> had an impact factor of 4.7 and a 5-year impact factor of 4.2 [<xref ref-type="bibr" rid="ref35">35</xref>]. <italic>Tobacco Induced Diseases</italic> [<xref ref-type="bibr" rid="ref36">36</xref>] and <italic>Tobacco Prevention and Cessation</italic> [<xref ref-type="bibr" rid="ref37">37</xref>] are 2 other peer-reviewed journals that specifically publish research on nicotine and tobacco products but are not as highly ranked as the other 2 journals. The textual data from the 4 peer-reviewed journals contained a total of 2993 abstracts from papers published from 2015 to early 2021.</p>
          <p>While the 2993 articles extracted from these journals do not represent the full body of tobacco research, they cover a significant share of tobacco studies and integrate evidence across the 5 translational research stages: basic research, preclinical research, clinical research, clinical implementation, and public health. These journals also ask authors to specify how the research reported contributes to tobacco control objectives, which have policy implications. Alternatively, a random sampling from PubMed searches using tobacco-related terms may not yield studies that are necessarily translational in nature. Therefore, we focused on the articles published in the 4 journals in our study.</p>
        </sec>
        <sec>
          <title>Iterative Process to Expand Terms (Named Entities) in the Database</title>
          <p>The general process included the following iterative steps: (1) to generate initial annotation data, we first compiled key terms from extracted articles and allocated key terms to categories using group discussions; (2) we enriched the database using various sources and group discussions (more specific descriptions below); (3) we fine-tuned the <italic>spaCy</italic> en_core_web_lg model with the initial annotation and following iterative versions of data (the en_core_web_lg model is a pretrained large language model that can extract multiple general named entities); (4) we expanded the list of named entities to include more keywords of similar meanings using SeedNER [<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref39">39</xref>], that is, a small set of initial labeled examples or patterns that was used as a starting point for training a model; (5) we searched the occurrence of each keyword in the 2993 paper abstracts and kept those with high frequency; (6) during this process, named entities that were too generic to yield meaningful relations were removed from the database; and (7) we repeated steps 3 to 6 until the set of entities reached our satisfaction during group discussions.</p>
          <p>Specific approaches were used for conducting step 2. For categories including “tobacco use behavioral outcomes,” “tobacco products,” and “tobacco characteristics,” the iterative process involved four steps: (1) discussions to determine whether to include newly identified key terms and how to allocate them into additional subcategories (<xref ref-type="table" rid="table1">Table 1</xref>); (2) using a named entity recognition (NER) model to extract named entities from 2993 paper abstracts from the 4 specific journals; (3) randomly sampling and reviewing the output of the NER model, correcting identified errors, and adding missed NERs; and (4) repeating steps 1 to 3 until we were satisfied with the model output.</p>
          <p>The categories “population characteristics,” “geographic locations,” and “relation terms” are commonly used concepts in real life and not specific to tobacco control. We used Google searches, Wikipedia, and WordNet to enrich the key terms. In addition, for the “method and inference” category, we used the glossary of an econometrics methodology textbook by Cameron and Trivedi to enrich the terms [<xref ref-type="bibr" rid="ref40">40</xref>]. This textbook is widely used in economics and social science and its glossary should provide sufficient terms for this category.</p>
          <p>For the “policy” category, we drew named entities from 2 sources that comprehensively summarize available tobacco control policies in the regulatory space. The first source was a peer-reviewed journal article by McDaniel et al [<xref ref-type="bibr" rid="ref41">41</xref>] that conducted an intensive policy scan of all possible regulations that can contribute to tobacco endgame. The second source was the World Health Organization’s report on the global progress in implementing tobacco control policies, as recommended by the World Health Organization’s Framework Convention on Tobacco Control [<xref ref-type="bibr" rid="ref42">42</xref>], which is the largest public health treaty signed by 182 countries and prescribes a comprehensive set of tobacco control policies. These policies are classified into 6 groups: M (monitor tobacco use and prevention policies), P (protect people from tobacco smoke), O (offer help to quit tobacco use), W (warn about the dangers of tobacco), E (enforce bans on tobacco advertising, promotion, and sponsorship), and R (raise taxes on tobacco) [<xref ref-type="bibr" rid="ref42">42</xref>]. These sources cover policy key terms related to both national and international contexts and together create the most comprehensive policy terms to our knowledge.</p>
        </sec>
      </sec>
      <sec>
        <title>Development of NLP Algorithms That Comprehend the Literature on Nicotine and Tobacco Product Use Among Sexual and Gender Diverse Populations</title>
        <p>We used RoBERTa, an optimized BERT (bidirectional encoder representations from transformers)-based language model [<xref ref-type="bibr" rid="ref43">43</xref>], to perform NER tasks. BERT is a state-of-the-art language model that excels at tasks such as sentiment analysis and text summarization. By learning patterns and relationships between words and their context in text, BERT can extract named entities that it has learned during training and potentially discover new ones.</p>
        <p>We developed an NER model based on RoBERTa using the Python (Python Software Foundation) programming language and the <italic>spaCy</italic> library [<xref ref-type="bibr" rid="ref44">44</xref>]. We began by defining 36 labels of categories (main and subcategories; <xref ref-type="table" rid="table1">Table 1</xref>) and extracting 1582 named entities using the existing NER model RoBERTa. Next, those named entities were used to tag abstracts and create a training set, using the annotation tool Prodigy [<xref ref-type="bibr" rid="ref45">45</xref>]. A subset of the abstracts with labeled named entities was reviewed by 2 domain experts to identify key terms that were missing in our semantic database, which were added to the lists of named entities.</p>
        <p>The RoBERTa model was then updated based on the richer database and further trained for a maximum of 20,000 steps, with early stopping implemented if no improvement was observed for 1600 consecutive steps. With a series of iterations, we used the updated RoBERTa model to assess the 2993 abstracts and labeled them with the categories.</p>
        <p>When identifying studies related to LGBTQ+ populations, it is important to understand that this community is heterogeneous [<xref ref-type="bibr" rid="ref46">46</xref>,<xref ref-type="bibr" rid="ref47">47</xref>]. Given that LGBTQ+ key terms are included in the “population characteristics” categories, we were able to identify LGBTQ+ populations based on categorization. There were 111 LGBTQ+-related named entities in our database.</p>
      </sec>
      <sec>
        <title>Comparison of the Discoveries of the NLP Algorithms With an Ongoing Systematic Review of Tobacco Policy Research Among LGBTQ+ Populations</title>
        <p>Ideally, we would like to compare the results from our tools with those from systematic reviews and meta-analyses of studies related to tobacco control issues among LGBTQ+ populations. Systematic reviews and meta-analyses are state-of-the-art evidence synthesis methods that can provide the ground truth [<xref ref-type="bibr" rid="ref48">48</xref>-<xref ref-type="bibr" rid="ref50">50</xref>]. While we are currently conducting a separate systematic review of the effectiveness of tobacco control policies among LGBTQ+ populations, this review has not been finalized yet [<xref ref-type="bibr" rid="ref32">32</xref>]. Nonetheless, the ongoing systematic review does provide some data points for comparisons, including the number of studies extracted from the 4 journals and presence of policy assessment. Therefore, we conducted comparisons of these 2 domains.</p>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>This study does not involve human subjects, as it synthesizes data from research articles published in peer-reviewed journals. The Ohio State University Institutional Review Board has determined that it contains no human subjects and thus no further review is needed (study number: 2021E0776).</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <p>In total, we identified 33 articles relevant to sexual and gender diverse populations from the 2993 abstracts. Our trained model successfully extracted 773 named entities (181 unique named entities) from the 33 paper abstracts to describe the themes of these articles. Among the 773 extracted named entities, 688 were already learned by the model during training, while 70 were new time- or age-related words (eg, 18 years, 2013), 9 were new statistical terms (eg, N=20), and 6 were newly discovered and labeled within other categories. We did not observe any newly discovered policy-related terms.</p>
      <p>In <xref rid="figure1" ref-type="fig">Figures 1</xref>-<xref rid="figure3" ref-type="fig">3</xref>, we present the hierarchy of named entities extracted from abstracts in published papers that studied nicotine or tobacco product use among sexual and gender diverse individuals. Each number on the right is the frequency of the corresponding named entity by paper abstract. Named entities with the same color belong to the same main category.</p>
      <fig id="figure1" position="float">
        <label>Figure 1</label>
        <caption>
          <p>Hierarchy and frequency counts of named entities extracted from published research in tobacco-specific journals from 2015 to early 2021 in 4 main categories: tobacco use, products, characteristics, and relation statement. Numbers represent the frequency of the corresponding named entity by paper abstract.</p>
        </caption>
        <graphic xlink:href="formative_v8i1e49031_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <fig id="figure2" position="float">
        <label>Figure 2</label>
        <caption>
          <p>Hierarchy and frequency counts of named entities extracted from published research in tobacco-specific journals from 2015 to early 2021 in the main category of population characteristics. Numbers represent the frequency of the corresponding named entity by paper abstract.</p>
        </caption>
        <graphic xlink:href="formative_v8i1e49031_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <fig id="figure3" position="float">
        <label>Figure 3</label>
        <caption>
          <p>Hierarchy and frequency counts of named entities extracted from published research in tobacco-specific journals from 2015 to early 2021 in 3 main categories: policy, methods and inference, and geographic locations. Numbers represent the frequency of the corresponding named entity by paper abstract.</p>
        </caption>
        <graphic xlink:href="formative_v8i1e49031_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <p>According to our tool, among the 33 tobacco studies related to LGBTQ+ populations, the most frequent use outcomes were “cigarette smoking” (n=17), “substance use” (n=16), “prevalence” (n=16), and “risk” perception (n=14). Also, for these populations, “cigarettes” (n=15) were the most frequently mentioned combustible tobacco product and “e-cigarettes” (n=8) were the most frequently mentioned noncombustible tobacco product. In addition, for tobacco characteristics, “alcohol” (n=7) and “nicotine” (n=5) were the most mentioned attributes among LGBTQ+ tobacco research papers.</p>
      <p>The relation statement findings suggest that a majority of the studies examined “comparison” (n=26), “association” (n=23), and “correlation” (n=6). We found no studies that explicitly used the term “causal” or “causality” in the studies.</p>
      <p>The population characteristics mentioned in the studies illustrated that among socioeconomic status terms, the most frequently included were “demographics” (n=8) and “SES factors” (n=8). Among sex and sexual and gender minority terms, the most frequent ones were “bisexual” (n=21), “lesbian” (n=19), and “gay” (n=19). Among racial and ethnic minority group terms, the most frequent ones were “minority groups” (n=8) and “Race/ethnicity” (n=6). For age group terms, the terms included “adult” (n=14), “young adult” (n=11), “adolescent” (n=5), “students” (n=3), and “adolescents and young adults” (n=2).</p>
      <p>The policy category showed that in these studies, the most mentioned term was “intervention” (n=16). In addition, while the general term “tobacco control” was mentioned in 6 studies, only 1 study contained any specific policy term (“smoke free air law”). As such, there was a significant gap in policy research among the published articles in the 4 leading tobacco journals between 2015 and early 2021, since only 1 study mentions specific policies when it comes to tobacco research among the LGBTQ+ populations. The statistics and methodology terms further indicated that the most used terms included “survey” (n=18) and “logistic regression” (n=10), and relatively fewer studies mentioned terms related to causal inferences, such as “experimental research” (n=4), “randomization” (n=3), and “clinical trial” (n=1). The studies mentioning “US” also dominated in the numbers, with 12 studies in total. Several studies that assessed countries with multiple levels of government, such as Canada and the United States, also appeared to have mentioned “state,” “city,” and “province,” suggesting that attention was paid to these defined areas.</p>
      <p>We next compared our results using the NLP tools with our ongoing systematic review. Similar to the conclusions of the ongoing systematic review, we found very few studies that yielded specific policy recommendations. This finding was further corroborated by the lack of causal inference methods labeled by the NLP tool. While our NLP tool cannot replace systematic reviews just yet, it does show potential to complement the existing methods and requires less human supervision (systematic reviews usually require at least 2 human coders).</p>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <p>This pilot study built a semantic database dedicated to tobacco research and developed NLP algorithms to automatically identify, extract, and summarize textual data from published tobacco studies. We further demonstrated a use case wherein we assessed LGBTQ+ tobacco research by labeling key components of a tobacco study: tobacco use outcomes, tobacco characteristics, population characteristics, geographic locations, method and inference, and policy relevance.</p>
      <p>It is worth noting that the components we categorized, such as “method and inference,” align with the typical sections found in scientific articles in social science, including measures, methods, results, conclusions, and hypothesis testing. As a result, our tool extracts text segments that are frequently assessed in evidence synthesis, thereby showing the potential of using NLP tools to enhance systematic reviews and facilitate meta-analyses [<xref ref-type="bibr" rid="ref25">25</xref>].</p>
      <p>Additionally, we leveraged the NLP algorithms we created to identify gaps in tobacco research concerning the LGBTQ+ populations and concluded that there is a scarcity of studies assessing policy impacts on this demographic using causal inference methods. This finding is consistent with our ongoing systematic review [<xref ref-type="bibr" rid="ref32">32</xref>], highlighting how NLP tools have the capacity to aid in both evidence synthesis and research gap discoveries. This, in turn, has the potential to streamline research efforts, reduce labor costs, and influence the trajectories of future research directions [<xref ref-type="bibr" rid="ref51">51</xref>,<xref ref-type="bibr" rid="ref52">52</xref>].</p>
      <p>Using the NLP tool, we further found some interesting patterns in tobacco research involving LGBTQ+ populations. It appears that the product drawing the most attention in the field is cigarettes or cigarette smoking and that the number of studies of various age groups is almost evenly distributed between youth or young adults and adults. Moreover, the existing evidence body is dominated by studies coming from the United States. These patterns are consistent with the research needs to reduce cigarette smoking among LGBTQ+ populations in the United States, where 16.1% of LGBTQ+ adults and 17.4% of LGBTQ+ high school students smoke cigarettes—this is 4% to 6% higher than their heterosexual counterparts [<xref ref-type="bibr" rid="ref53">53</xref>,<xref ref-type="bibr" rid="ref54">54</xref>]. Therefore, our findings align with the ongoing research needs and the financial investments made by the US health agencies like the NIH, thereby bolstering the confidence in the NLP tool that we developed.</p>
      <p>Finally, while the semantic database and language model in this pilot study are designed to extract and summarize key components of tobacco research, many of the terms and labeling categories are broad and applicable to public health and social science research in general, such as “methods and inference” and “relation terms.” Therefore, our tool has the potential to transform the evidence synthesis paradigm in tobacco control and public health at large by enabling more efficient and effective analyses of large volumes of textual data. Future tool development may extend its reach to other public health domains, fostering the real-time translation of research findings into evidence-based policymaking, thereby contributing significantly to the advancement of public health initiatives.</p>
      <p>Our study has several limitations. First, for the development of keywords and the application of the NLP, we focused on 4 peer-reviewed tobacco-specific research journals, which were not representative of the entire tobacco control literature. However, considering the prominence and extensive content covered by these journals, we believe that this selection is unlikely to introduce significant selection bias or result in the omission of crucial keywords. Second, although we used our ongoing systematic review as a benchmark for the qualitative assessment of the results obtained in this pilot study, we did not perform a quantitative comparison of our findings with the ground truth derived from the systematic review. This quantitative evaluation, which might include measures like Cohen kappa, was not conducted because the systematic review has not yet been finalized. Consequently, future research endeavors are required to undertake a thorough quantitative comparison between the training data and the established ground truth using statistical testing for a more comprehensive assessment of the NLP tool’s performance.</p>
      <p>Despite the limitations, our pilot study serves as a compelling demonstration of the capabilities of NLP tools in expediting the processes of evidence synthesis and the identification of research gaps. Expanding the scope of this pilot research to encompass other public health disciplines, extending beyond the realm of tobacco control, holds the promise of fundamentally transforming the approach to evidence synthesis. Such expansion has the potential to play a pivotal role in shaping policy development across a wide spectrum of public health domains.</p>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Tobacco-related funding from the National Institutes of Health (NIH), 2010-2022. Data was obtained from the National Institutes of Health [<xref ref-type="bibr" rid="ref13">13</xref>].</p>
        <media xlink:href="formative_v8i1e49031_app1.png" xlink:title="PNG File , 102 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">BERT</term>
          <def>
            <p>bidirectional encoder representations from transformers</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">LGBTQ+</term>
          <def>
            <p>lesbian, gay, bisexual, transgender, queer, intersex, asexual, Two Spirit, and other persons who identify as part of this community</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">NER</term>
          <def>
            <p>named entity recognition</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">NIH</term>
          <def>
            <p>National Institutes of Health</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This study was supported by the President’s Research Excellence (PRE) Accelerator Grant from The Ohio State University (principal investigator: CS). CS was funded by the National Cancer Institute (R21CA249757). SM was supported by the Pelotonia Fellowship from The Ohio State University Comprehensive Cancer Center.</p>
      <p>During the preparation of this work, the authors used ChatGPT 3.5 in order to check grammar errors and improve language flow. After using this tool, the authors reviewed and edited the content as needed and take full responsibility for the content of the publication.</p>
    </ack>
    <notes>
      <sec>
        <title>Data Availability</title>
        <p>The data sets generated and analyzed during this study are available in the GitHub repository [<xref ref-type="bibr" rid="ref55">55</xref>].</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="con">
        <p>CS and SM conceptualized the study. JC, ML, SJ, CS, and SM designed the methodology. SJ and ML were responsible for the software. CS and JC validated the data. SM and SJ performed the formal analysis. ML, SJ, and SM carried out the investigation. CS and JC provided resources. ML, OY, XZ, YF, YZ, SJ, and SM performed data curation. SM and SJ wrote the original draft. SM, SJ, JC, and CS reviewed and edited the manuscript. CS and JC supervised the study. ML and SJ were responsible for project administration. CS acquired funding. All authors have read and agreed to the published version of the manuscript.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>United States Public Health Service Office of the Surgeon General</collab>
          </person-group>
          <article-title>Smoking cessation: a report of the surgeon general</article-title>
          <source>National Library of Medicine</source>
          <year>2020</year>
          <access-date>2024-01-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ncbi.nlm.nih.gov/books/NBK555591/">https://www.ncbi.nlm.nih.gov/books/NBK555591/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>National Center for Chronic Disease Prevention and Health Promotion (US) Office on Smoking and Health</collab>
          </person-group>
          <article-title>The health consequences of smoking—50 years of progress</article-title>
          <source>National Library of Medicine</source>
          <year>2014</year>
          <access-date>2024-01-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ncbi.nlm.nih.gov/books/NBK179276/">https://www.ncbi.nlm.nih.gov/books/NBK179276/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="web">
          <article-title>LGBTQ+ people experience a health burden from commercial tobacco</article-title>
          <source>Centers for Disease Control and Prevention</source>
          <year>2022</year>
          <access-date>2024-01-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cdc.gov/tobacco/health-equity/lgbtq/health-burden.html">https://www.cdc.gov/tobacco/health-equity/lgbtq/health-burden.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Banbhrani</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Conditional probability joint extraction of nested biomedical events: design of a unified extraction framework based on neural networks</article-title>
          <source>JMIR Med Inform</source>
          <year>2022</year>
          <month>06</month>
          <day>07</day>
          <volume>10</volume>
          <issue>6</issue>
          <fpage>e37804</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2022/6/e37804/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/37804</pub-id>
          <pub-id pub-id-type="medline">35671070</pub-id>
          <pub-id pub-id-type="pii">v10i6e37804</pub-id>
          <pub-id pub-id-type="pmcid">PMC9214613</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Elmessiry</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cooper</surname>
              <given-names>WO</given-names>
            </name>
            <name name-style="western">
              <surname>Catron</surname>
              <given-names>TF</given-names>
            </name>
            <name name-style="western">
              <surname>Karrass</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>MP</given-names>
            </name>
          </person-group>
          <article-title>Triaging patient complaints: Monte Carlo cross-validation of six machine learning classifiers</article-title>
          <source>JMIR Med Inform</source>
          <year>2017</year>
          <month>07</month>
          <day>31</day>
          <volume>5</volume>
          <issue>3</issue>
          <fpage>e19</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2017/3/e19/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/medinform.7140</pub-id>
          <pub-id pub-id-type="medline">28760726</pub-id>
          <pub-id pub-id-type="pii">v5i3e19</pub-id>
          <pub-id pub-id-type="pmcid">PMC5556254</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Rankine</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Aghaarabi</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Benchmarking effectiveness and efficiency of deep learning models for semantic textual similarity in the clinical domain: validation study</article-title>
          <source>JMIR Med Inform</source>
          <year>2021</year>
          <month>12</month>
          <day>30</day>
          <volume>9</volume>
          <issue>12</issue>
          <fpage>e27386</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2021/12/e27386/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/27386</pub-id>
          <pub-id pub-id-type="medline">34967748</pub-id>
          <pub-id pub-id-type="pii">v9i12e27386</pub-id>
          <pub-id pub-id-type="pmcid">PMC8759018</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Harvey</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Lobban</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Rayson</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Warner</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Natural language processing methods and bipolar disorder: scoping review</article-title>
          <source>JMIR Ment Health</source>
          <year>2022</year>
          <month>04</month>
          <day>22</day>
          <volume>9</volume>
          <issue>4</issue>
          <fpage>e35928</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mental.jmir.org/2022/4/e35928/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/35928</pub-id>
          <pub-id pub-id-type="medline">35451984</pub-id>
          <pub-id pub-id-type="pii">v9i4e35928</pub-id>
          <pub-id pub-id-type="pmcid">PMC9077496</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Gupta</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Singhal</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Muttreja</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sharma</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Piterova</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>An artificial intelligence chatbot for young people's sexual and reproductive health in India (SnehAI): instrumental case study</article-title>
          <source>J Med Internet Res</source>
          <year>2022</year>
          <month>01</month>
          <day>03</day>
          <volume>24</volume>
          <issue>1</issue>
          <fpage>e29969</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2022/1/e29969/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/29969</pub-id>
          <pub-id pub-id-type="medline">34982034</pub-id>
          <pub-id pub-id-type="pii">v24i1e29969</pub-id>
          <pub-id pub-id-type="pmcid">PMC8764609</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stevens</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Rasul</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Oh</surname>
              <given-names>YJ</given-names>
            </name>
          </person-group>
          <article-title>Emotions and incivility in vaccine mandate discourse: natural language processing insights</article-title>
          <source>JMIR Infodemiology</source>
          <year>2022</year>
          <volume>2</volume>
          <issue>2</issue>
          <fpage>e37635</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://infodemiology.jmir.org/2022/2/e37635/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/37635</pub-id>
          <pub-id pub-id-type="medline">36188420</pub-id>
          <pub-id pub-id-type="pii">v2i2e37635</pub-id>
          <pub-id pub-id-type="pmcid">PMC9511016</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>El Morr</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Maret</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Muhlenbach</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Dharmalingam</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Tadesse</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Creighton</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kundi</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Buettgen</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mgwigwi</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Dinca-Panaitescu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Dua</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Gorman</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>A virtual community for disability advocacy: development of a searchable artificial intelligence-supported platform</article-title>
          <source>JMIR Form Res</source>
          <year>2021</year>
          <month>11</month>
          <day>05</day>
          <volume>5</volume>
          <issue>11</issue>
          <fpage>e33335</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://formative.jmir.org/2021/11/e33335/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/33335</pub-id>
          <pub-id pub-id-type="medline">34738910</pub-id>
          <pub-id pub-id-type="pii">v5i11e33335</pub-id>
          <pub-id pub-id-type="pmcid">PMC8663581</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Perry</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Creamer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chaffee</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Unger</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sutfin</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Kong</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Shang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Clendennen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Krishnan-Sarin</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Pentz</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Research on youth and young adult tobacco use, 2013-2018, from the Food and Drug Administration-National Institutes of Health Tobacco Centers of Regulatory Science</article-title>
          <source>Nicotine Tob Res</source>
          <year>2020</year>
          <month>06</month>
          <day>12</day>
          <volume>22</volume>
          <issue>7</issue>
          <fpage>1063</fpage>
          <lpage>1076</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31127298"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/ntr/ntz059</pub-id>
          <pub-id pub-id-type="medline">31127298</pub-id>
          <pub-id pub-id-type="pii">5476524</pub-id>
          <pub-id pub-id-type="pmcid">PMC7457341</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Higgins</surname>
              <given-names>ST</given-names>
            </name>
            <name name-style="western">
              <surname>Kurti</surname>
              <given-names>AN</given-names>
            </name>
            <name name-style="western">
              <surname>Palmer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tidey</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Cepeda-Benito</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cooper</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Krebs</surname>
              <given-names>NM</given-names>
            </name>
            <name name-style="western">
              <surname>Baezconde-Garbanati</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Hart</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Stanton</surname>
              <given-names>CA</given-names>
            </name>
          </person-group>
          <article-title>A review of tobacco regulatory science research on vulnerable populations</article-title>
          <source>Prev Med</source>
          <year>2019</year>
          <month>11</month>
          <volume>128</volume>
          <fpage>105709</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S0091-7435(19)30163-X"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ypmed.2019.04.024</pub-id>
          <pub-id pub-id-type="medline">31054904</pub-id>
          <pub-id pub-id-type="pii">S0091-7435(19)30163-X</pub-id>
          <pub-id pub-id-type="pmcid">PMC6824984</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="web">
          <article-title>RePORTER</article-title>
          <source>National Institutes of Health</source>
          <access-date>2024-01-19</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://reporter.nih.gov/">https://reporter.nih.gov/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Neumann</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>King</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Beltagy</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Ammar</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>ScispaCy: fast and robust models for biomedical natural language processing</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on February 20, 2019. <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1902.07669"/>
          </comment>
          <pub-id pub-id-type="doi">10.18653/v1/w19-5034</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nadkarni</surname>
              <given-names>PM</given-names>
            </name>
            <name name-style="western">
              <surname>Ohno-Machado</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Chapman</surname>
              <given-names>WW</given-names>
            </name>
          </person-group>
          <article-title>Natural language processing: an introduction</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2011</year>
          <volume>18</volume>
          <issue>5</issue>
          <fpage>544</fpage>
          <lpage>551</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/21846786"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/amiajnl-2011-000464</pub-id>
          <pub-id pub-id-type="medline">21846786</pub-id>
          <pub-id pub-id-type="pii">amiajnl-2011-000464</pub-id>
          <pub-id pub-id-type="pmcid">PMC3168328</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Hogan</surname>
              <given-names>WR</given-names>
            </name>
            <name name-style="western">
              <surname>Crowley</surname>
              <given-names>RS</given-names>
            </name>
          </person-group>
          <article-title>Natural language processing methods and systems for biomedical ontology learning</article-title>
          <source>J Biomed Inform</source>
          <year>2011</year>
          <month>02</month>
          <volume>44</volume>
          <issue>1</issue>
          <fpage>163</fpage>
          <lpage>179</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(10)00105-X"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2010.07.006</pub-id>
          <pub-id pub-id-type="medline">20647054</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(10)00105-X</pub-id>
          <pub-id pub-id-type="pmcid">PMC2990796</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Yoon</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>So</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Kang</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>BioBERT: a pre-trained biomedical language representation model for biomedical text mining</article-title>
          <source>Bioinformatics</source>
          <year>2020</year>
          <month>02</month>
          <day>15</day>
          <volume>36</volume>
          <issue>4</issue>
          <fpage>1234</fpage>
          <lpage>1240</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31501885"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/btz682</pub-id>
          <pub-id pub-id-type="medline">31501885</pub-id>
          <pub-id pub-id-type="pii">5566506</pub-id>
          <pub-id pub-id-type="pmcid">PMC7703786</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nallapati</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Nogueira dos Santos</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Gulcehre</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Xiang</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Abstractive text summarization using sequence-to-sequence RNNs and beyond</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on February 19, 2016. <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1602.06023"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Oliveira</surname>
              <given-names>CR</given-names>
            </name>
            <name name-style="western">
              <surname>Niccolai</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Ortiz</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Sheth</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Shapiro</surname>
              <given-names>ED</given-names>
            </name>
            <name name-style="western">
              <surname>Niccolai</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Brandt</surname>
              <given-names>CA</given-names>
            </name>
          </person-group>
          <article-title>Natural language processing for surveillance of cervical and anal cancer and precancer: algorithm development and split-validation study</article-title>
          <source>JMIR Med Inform</source>
          <year>2020</year>
          <month>11</month>
          <day>03</day>
          <volume>8</volume>
          <issue>11</issue>
          <fpage>e20826</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2020/11/e20826/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/20826</pub-id>
          <pub-id pub-id-type="medline">32469840</pub-id>
          <pub-id pub-id-type="pii">v8i11e20826</pub-id>
          <pub-id pub-id-type="pmcid">PMC7671846</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rybinski</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dai</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Karimi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Extracting family history information from electronic health records: natural language processing analysis</article-title>
          <source>JMIR Med Inform</source>
          <year>2021</year>
          <month>04</month>
          <day>30</day>
          <volume>9</volume>
          <issue>4</issue>
          <fpage>e24020</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2021/4/e24020/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/24020</pub-id>
          <pub-id pub-id-type="medline">33664015</pub-id>
          <pub-id pub-id-type="pii">v9i4e24020</pub-id>
          <pub-id pub-id-type="pmcid">PMC8092929</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wen</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Moon</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Fu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Peterson</surname>
              <given-names>KJ</given-names>
            </name>
            <name name-style="western">
              <surname>Ai</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kavuluru</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Acquisition of a lexicon for family history information: bidirectional encoder representations from transformers-assisted sublanguage analysis</article-title>
          <source>JMIR Med Inform</source>
          <year>2023</year>
          <month>06</month>
          <day>27</day>
          <volume>11</volume>
          <fpage>e48072</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2023/1/e48072/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/48072</pub-id>
          <pub-id pub-id-type="medline">37368483</pub-id>
          <pub-id pub-id-type="pii">v11i1e48072</pub-id>
          <pub-id pub-id-type="pmcid">PMC10337517</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tomaszewski</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Morales</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lourentzou</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Caskey</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Schwartz</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Chin</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Identifying false human papillomavirus (HPV) vaccine information and corresponding risk perceptions from Twitter: advanced predictive models</article-title>
          <source>J Med Internet Res</source>
          <year>2021</year>
          <month>09</month>
          <day>09</day>
          <volume>23</volume>
          <issue>9</issue>
          <fpage>e30451</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2021/9/e30451/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/30451</pub-id>
          <pub-id pub-id-type="medline">34499043</pub-id>
          <pub-id pub-id-type="pii">v23i9e30451</pub-id>
          <pub-id pub-id-type="pmcid">PMC8461539</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stevens</surname>
              <given-names>HR</given-names>
            </name>
            <name name-style="western">
              <surname>Acic</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Rhea</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Natural language processing insight into LGBTQ+ youth mental health during the COVID-19 pandemic: longitudinal content analysis of anxiety-provoking topics and trends in emotion in LGBTeens microcommunity subreddit</article-title>
          <source>JMIR Public Health Surveill</source>
          <year>2021</year>
          <month>08</month>
          <day>17</day>
          <volume>7</volume>
          <issue>8</issue>
          <fpage>e29029</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://publichealth.jmir.org/2021/8/e29029/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/29029</pub-id>
          <pub-id pub-id-type="medline">34402803</pub-id>
          <pub-id pub-id-type="pii">v7i8e29029</pub-id>
          <pub-id pub-id-type="pmcid">PMC8372845</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kundu</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Chaiton</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Billington</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Grace</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Fu</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Logie</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Baskerville</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Yager</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Mitsakakis</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Schwartz</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Machine learning applications in mental health and substance use research among the LGBTQ2S+ population: scoping review</article-title>
          <source>JMIR Med Inform</source>
          <year>2021</year>
          <month>11</month>
          <day>11</day>
          <volume>9</volume>
          <issue>11</issue>
          <fpage>e28962</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2021/11/e28962/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/28962</pub-id>
          <pub-id pub-id-type="medline">34762059</pub-id>
          <pub-id pub-id-type="pii">v9i11e28962</pub-id>
          <pub-id pub-id-type="pmcid">PMC8663464</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Baclic</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Tunis</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Young</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Doan</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Swerdfeger</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Schonfeld</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Challenges and opportunities for public health made possible by advances in natural language processing</article-title>
          <source>Can Commun Dis Rep</source>
          <year>2020</year>
          <month>06</month>
          <day>04</day>
          <volume>46</volume>
          <issue>6</issue>
          <fpage>161</fpage>
          <lpage>168</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32673380"/>
          </comment>
          <pub-id pub-id-type="doi">10.14745/ccdr.v46i06a02</pub-id>
          <pub-id pub-id-type="medline">32673380</pub-id>
          <pub-id pub-id-type="pii">460602</pub-id>
          <pub-id pub-id-type="pmcid">PMC7343054</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="web">
          <article-title>Achieving health equity in tobacco control</article-title>
          <source>Truth Initiative</source>
          <year>2015</year>
          <access-date>2024-01-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://truthinitiative.org/sites/default/files/media/files/2019/03/Achieving">https://truthinitiative.org/sites/default/files/media/files/2019/03/Achieving</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hopkins</surname>
              <given-names>DP</given-names>
            </name>
            <name name-style="western">
              <surname>Razi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Leeks</surname>
              <given-names>KD</given-names>
            </name>
            <name name-style="western">
              <surname>Priya Kalra</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Chattopadhyay</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Soler</surname>
              <given-names>RE</given-names>
            </name>
          </person-group>
          <article-title>Smokefree policies to reduce tobacco use. A systematic review</article-title>
          <source>Am J Prev Med</source>
          <year>2010</year>
          <month>02</month>
          <volume>38</volume>
          <issue>2 Suppl</issue>
          <fpage>S275</fpage>
          <lpage>S289</lpage>
          <pub-id pub-id-type="doi">10.1016/j.amepre.2009.10.029</pub-id>
          <pub-id pub-id-type="medline">20117612</pub-id>
          <pub-id pub-id-type="pii">S0749-3797(09)00751-X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Levy</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Mays</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Boyle</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Tam</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chaloupka</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>The effect of tobacco control policies on US smokeless tobacco use: a structured review</article-title>
          <source>Nicotine Tob Res</source>
          <year>2017</year>
          <month>12</month>
          <day>13</day>
          <volume>20</volume>
          <issue>1</issue>
          <fpage>3</fpage>
          <lpage>11</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/27798090"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/ntr/ntw291</pub-id>
          <pub-id pub-id-type="medline">27798090</pub-id>
          <pub-id pub-id-type="pii">ntw291</pub-id>
          <pub-id pub-id-type="pmcid">PMC5896466</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chaloupka</surname>
              <given-names>FJ</given-names>
            </name>
            <name name-style="western">
              <surname>Straif</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Leon</surname>
              <given-names>ME</given-names>
            </name>
            <collab>Working Group, International Agency for Research on Cancer</collab>
          </person-group>
          <article-title>Effectiveness of tax and price policies in tobacco control</article-title>
          <source>Tob Control</source>
          <year>2011</year>
          <month>05</month>
          <volume>20</volume>
          <issue>3</issue>
          <fpage>235</fpage>
          <lpage>238</lpage>
          <pub-id pub-id-type="doi">10.1136/tc.2010.039982</pub-id>
          <pub-id pub-id-type="medline">21115556</pub-id>
          <pub-id pub-id-type="pii">tc.2010.039982</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Flor</surname>
              <given-names>LS</given-names>
            </name>
            <name name-style="western">
              <surname>Reitsma</surname>
              <given-names>MB</given-names>
            </name>
            <name name-style="western">
              <surname>Gupta</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Ng</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gakidou</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>The effects of tobacco control policies on global smoking prevalence</article-title>
          <source>Nat Med</source>
          <year>2021</year>
          <month>02</month>
          <volume>27</volume>
          <issue>2</issue>
          <fpage>239</fpage>
          <lpage>243</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33479500"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41591-020-01210-8</pub-id>
          <pub-id pub-id-type="medline">33479500</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41591-020-01210-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC7884287</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Feliu</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Filippidis</surname>
              <given-names>FT</given-names>
            </name>
            <name name-style="western">
              <surname>Joossens</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Fong</surname>
              <given-names>GT</given-names>
            </name>
            <name name-style="western">
              <surname>Vardavas</surname>
              <given-names>CI</given-names>
            </name>
            <name name-style="western">
              <surname>Baena</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Castellano</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Martínez</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Fernández</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Impact of tobacco control policies on smoking prevalence and quit ratios in 27 European Union countries from 2006 to 2014</article-title>
          <source>Tob Control</source>
          <year>2019</year>
          <month>01</month>
          <volume>28</volume>
          <issue>1</issue>
          <fpage>101</fpage>
          <lpage>109</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://tobaccocontrol.bmj.com/lookup/pmidlookup?view=long&#38;pmid=29472445"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/tobaccocontrol-2017-054119</pub-id>
          <pub-id pub-id-type="medline">29472445</pub-id>
          <pub-id pub-id-type="pii">tobaccocontrol-2017-054119</pub-id>
          <pub-id pub-id-type="pmcid">PMC6317447</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Mirza</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Schuster</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bridges</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Shang</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>A systematic review of the effects of tobacco control policies on tobacco use among LGBTQIA+ populations</article-title>
          <source>PROSPERO 2022 CRD42022360559</source>
          <access-date>2024-01-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.crd.york.ac.uk/prospero/display_record.php?ID=CRD42022360559">https://www.crd.york.ac.uk/prospero/display_record.php?ID=CRD42022360559</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hamilton</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Strauss</surname>
              <given-names>AT</given-names>
            </name>
            <name name-style="western">
              <surname>Martinez</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Hinson</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Levin</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Klein</surname>
              <given-names>EY</given-names>
            </name>
          </person-group>
          <article-title>Machine learning and artificial intelligence: applications in healthcare epidemiology</article-title>
          <source>Antimicrob Steward Healthc Epidemiol</source>
          <year>2021</year>
          <volume>1</volume>
          <issue>1</issue>
          <fpage>e28</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/36168500"/>
          </comment>
          <pub-id pub-id-type="doi">10.1017/ash.2021.192</pub-id>
          <pub-id pub-id-type="medline">36168500</pub-id>
          <pub-id pub-id-type="pii">S2732494X21001923</pub-id>
          <pub-id pub-id-type="pmcid">PMC9495400</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="web">
          <article-title>About</article-title>
          <source>Tobacco Control</source>
          <access-date>2023-12-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://tobaccocontrol.bmj.com/pages/about">https://tobaccocontrol.bmj.com/pages/about</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="web">
          <article-title>About the journal</article-title>
          <source>Nicotine &#38; Tobacco Research</source>
          <access-date>2023-12-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://academic.oup.com/ntr/pages/About">https://academic.oup.com/ntr/pages/About</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="web">
          <article-title>Aims and scope</article-title>
          <source>Tobacco Induced Diseases</source>
          <access-date>2023-12-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.tobaccoinduceddiseases.org/Aims-and-Scope,386.html">http://www.tobaccoinduceddiseases.org/Aims-and-Scope,386.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="web">
          <source>Tobacco Prevention &#38; Cessation</source>
          <access-date>2023-12-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.tobaccopreventioncessation.com/Aim-Scope,198.html">http://www.tobaccopreventioncessation.com/Aim-Scope,198.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ratinov</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Roth</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Design challenges and misconceptions in named entity recognition</article-title>
          <source>CoNLL '09</source>
          <access-date>2024-01-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://cogcomp.org/papers/RatinovRo09.pdf">http://cogcomp.org/papers/RatinovRo09.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ren</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Voss</surname>
              <given-names>CR</given-names>
            </name>
            <name name-style="western">
              <surname>Han</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Automated phrase mining from massive text corpora</article-title>
          <source>IEEE Trans Knowl Data Eng</source>
          <year>2018</year>
          <month>10</month>
          <day>1</day>
          <volume>30</volume>
          <issue>10</issue>
          <fpage>1825</fpage>
          <lpage>1837</lpage>
          <pub-id pub-id-type="doi">10.1109/tkde.2018.2812203</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cameron</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Trivedi</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <source>Microeconometrics: Methods and Applications</source>
          <year>2005</year>
          <publisher-loc>Cambridge, United Kingdom</publisher-loc>
          <publisher-name>Cambridge University Press</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>McDaniel</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Malone</surname>
              <given-names>RE</given-names>
            </name>
          </person-group>
          <article-title>The tobacco endgame: a qualitative review and synthesis</article-title>
          <source>Tob Control</source>
          <year>2016</year>
          <month>09</month>
          <volume>25</volume>
          <issue>5</issue>
          <fpage>594</fpage>
          <lpage>604</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://tobaccocontrol.bmj.com/lookup/pmidlookup?view=long&#38;pmid=26320149"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/tobaccocontrol-2015-052356</pub-id>
          <pub-id pub-id-type="medline">26320149</pub-id>
          <pub-id pub-id-type="pii">tobaccocontrol-2015-052356</pub-id>
          <pub-id pub-id-type="pmcid">PMC5036259</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="web">
          <article-title>WHO report on the global tobacco epidemic 2021: addressing new and emerging products</article-title>
          <source>World Health Organization</source>
          <year>2021</year>
          <access-date>2024-01-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.who.int/publications/i/item/9789240032095">https://www.who.int/publications/i/item/9789240032095</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Ott</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Goyal</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Du</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Joshi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Levy</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Lewis</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Zettlemoyer</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Stoyanov</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>RoBERTa: a robustly optimized BERT pretraining approach</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on July 26, 2019. <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1907.11692"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="web">
          <source>spaCy</source>
          <access-date>2024-01-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://spacy.io/">https://spacy.io/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="web">
          <source>Prodigy</source>
          <access-date>2024-01-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://prodi.gy/features/named-entity-recognition">https://prodi.gy/features/named-entity-recognition</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>White</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sepúlveda</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Patterson</surname>
              <given-names>CJ</given-names>
            </name>
          </person-group>
          <source>Understanding the Well-Being of LGBTQI+ Populations</source>
          <year>2020</year>
          <publisher-loc>Washington, DC</publisher-loc>
          <publisher-name>National Academies Press</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="web">
          <article-title>LGBTQIA resource center glossary</article-title>
          <source>University of California, Davis</source>
          <year>2023</year>
          <access-date>2024-01-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://lgbtqia.ucdavis.edu/educated/glossary">https://lgbtqia.ucdavis.edu/educated/glossary</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gopalakrishnan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ganeshkumar</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Systematic reviews and meta-analysis: understanding the best evidence in primary healthcare</article-title>
          <source>J Family Med Prim Care</source>
          <year>2013</year>
          <month>01</month>
          <volume>2</volume>
          <issue>1</issue>
          <fpage>9</fpage>
          <lpage>14</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.jfmpc.com/article.asp?issn=2249-4863;year=2013;volume=2;issue=1;spage=9;epage=14;aulast=Gopalakrishnan"/>
          </comment>
          <pub-id pub-id-type="doi">10.4103/2249-4863.109934</pub-id>
          <pub-id pub-id-type="medline">24479036</pub-id>
          <pub-id pub-id-type="pii">JFMPC-2-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC3894019</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sriganesh</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Shanthanna</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Busse</surname>
              <given-names>JW</given-names>
            </name>
          </person-group>
          <article-title>A brief overview of systematic reviews and meta-analyses</article-title>
          <source>Indian J Anaesth</source>
          <year>2016</year>
          <month>09</month>
          <volume>60</volume>
          <issue>9</issue>
          <fpage>689</fpage>
          <lpage>694</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.ijaweb.org/article.asp?issn=0019-5049;year=2016;volume=60;issue=9;spage=689;epage=694;aulast=Sriganesh"/>
          </comment>
          <pub-id pub-id-type="doi">10.4103/0019-5049.190628</pub-id>
          <pub-id pub-id-type="medline">27729699</pub-id>
          <pub-id pub-id-type="pii">IJA-60-689</pub-id>
          <pub-id pub-id-type="pmcid">PMC5037953</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gorelik</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gorelik</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ridout</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Nimarko</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Peisch</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Kuramkote</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Low</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pan</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Nrusimha</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Applying machine learning to increase efficiency and accuracy of meta-analytic review</article-title>
          <source>bioRxiv</source>
          <comment>Preprint posted online on October 8, 2020. <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.biorxiv.org/content/10.1101/2020.10.06.314245v1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1101/2020.10.06.314245</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Michelson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chow</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Martin</surname>
              <given-names>NA</given-names>
            </name>
            <name name-style="western">
              <surname>Ross</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tee Qiao Ying</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Minton</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence for rapid meta-analysis: case study on ocular toxicity of hydroxychloroquine</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <month>08</month>
          <day>17</day>
          <volume>22</volume>
          <issue>8</issue>
          <fpage>e20007</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/8/e20007/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/20007</pub-id>
          <pub-id pub-id-type="medline">32804086</pub-id>
          <pub-id pub-id-type="pii">v22i8e20007</pub-id>
          <pub-id pub-id-type="pmcid">PMC7459430</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Marshall</surname>
              <given-names>IJ</given-names>
            </name>
            <name name-style="western">
              <surname>Wallace</surname>
              <given-names>BC</given-names>
            </name>
          </person-group>
          <article-title>Toward systematic review automation: a practical guide to using machine learning tools in research synthesis</article-title>
          <source>Syst Rev</source>
          <year>2019</year>
          <month>07</month>
          <day>11</day>
          <volume>8</volume>
          <issue>1</issue>
          <fpage>163</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://systematicreviewsjournal.biomedcentral.com/articles/10.1186/s13643-019-1074-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s13643-019-1074-9</pub-id>
          <pub-id pub-id-type="medline">31296265</pub-id>
          <pub-id pub-id-type="pii">10.1186/s13643-019-1074-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC6621996</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cornelius</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Loretan</surname>
              <given-names>CG</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>TW</given-names>
            </name>
            <name name-style="western">
              <surname>Jamal</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Homa</surname>
              <given-names>DM</given-names>
            </name>
          </person-group>
          <article-title>Tobacco product use among adults - United States, 2020</article-title>
          <source>MMWR Morb Mortal Wkly Rep</source>
          <year>2022</year>
          <month>03</month>
          <day>18</day>
          <volume>71</volume>
          <issue>11</issue>
          <fpage>397</fpage>
          <lpage>405</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.15585/mmwr.mm7111a1"/>
          </comment>
          <pub-id pub-id-type="doi">10.15585/mmwr.mm7111a1</pub-id>
          <pub-id pub-id-type="medline">35298455</pub-id>
          <pub-id pub-id-type="pmcid">PMC8942309</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gentzke</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>TW</given-names>
            </name>
            <name name-style="western">
              <surname>Cornelius</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Park-Lee</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Ren</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Sawdey</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Cullen</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Loretan</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Jamal</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Homa</surname>
              <given-names>DM</given-names>
            </name>
          </person-group>
          <article-title>Tobacco product use and associated factors among middle and high school students - National Youth Tobacco Survey, United States, 2021</article-title>
          <source>MMWR Surveill Summ</source>
          <year>2022</year>
          <month>03</month>
          <day>11</day>
          <volume>71</volume>
          <issue>5</issue>
          <fpage>1</fpage>
          <lpage>29</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35271557"/>
          </comment>
          <pub-id pub-id-type="doi">10.15585/mmwr.ss7105a1</pub-id>
          <pub-id pub-id-type="medline">35271557</pub-id>
          <pub-id pub-id-type="pmcid">PMC8923300</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>LGBTQ-NER</article-title>
          <source>GitHub</source>
          <year>2023</year>
          <access-date>2024-01-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/jiangsn/LGBTQ-NER">https://github.com/jiangsn/LGBTQ-NER</ext-link>
          </comment>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
