<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Form Res</journal-id><journal-id journal-id-type="publisher-id">formative</journal-id><journal-id journal-id-type="index">27</journal-id><journal-title>JMIR Formative Research</journal-title><abbrev-journal-title>JMIR Form Res</abbrev-journal-title><issn pub-type="epub">2561-326X</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v8i1e63188</article-id><article-id pub-id-type="doi">10.2196/63188</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Comparing the Accuracy of Two Generated Large Language Models in Identifying Health-Related Rumors or Misconceptions and the Applicability in Health Science Popularization: Proof-of-Concept Study</article-title></title-group><contrib-group><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Luo</surname><given-names>Yuan</given-names></name><degrees>RN, MNS, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Miao</surname><given-names>Yiqun</given-names></name><degrees>RN, MNS, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Zhao</surname><given-names>Yuhan</given-names></name><degrees>RN, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Li</surname><given-names>Jiawei</given-names></name><degrees>BSc, RN</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Chen</surname><given-names>Yuling</given-names></name><degrees>RN, PhD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Yue</surname><given-names>Yuexue</given-names></name><degrees>RN, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Wu</surname><given-names>Ying</given-names></name><degrees>RN, FAAN, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib></contrib-group><aff id="aff1"><institution>School of Nursing, Capital Medical University</institution>, <addr-line>10 Xitoutiao, Youanmen Wai, Fengtai District</addr-line><addr-line>Beijing</addr-line>, <country>China</country></aff><aff id="aff2"><institution>School of Nursing, Johns Hopkins University</institution>, <addr-line>Baltimore</addr-line><addr-line>MD</addr-line>, <country>United States</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Mavragani</surname><given-names>Amaryllis</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Wang</surname><given-names>Ming-Hung</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Shalaby</surname><given-names>Mohammed Nader</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Ying Wu, RN, FAAN, PhD, School of Nursing, Capital Medical University, 10 Xitoutiao, Youanmen Wai, Fengtai District, Beijing, 100069, China, 86 10839117; <email>helenywu@vip.163.com</email></corresp><fn fn-type="equal" id="equal-contrib1"><label>*</label><p>these authors contributed equally</p></fn></author-notes><pub-date pub-type="collection"><year>2024</year></pub-date><pub-date pub-type="epub"><day>2</day><month>12</month><year>2024</year></pub-date><volume>8</volume><elocation-id>e63188</elocation-id><history><date date-type="received"><day>12</day><month>06</month><year>2024</year></date><date date-type="rev-recd"><day>04</day><month>10</month><year>2024</year></date><date date-type="accepted"><day>10</day><month>10</month><year>2024</year></date></history><copyright-statement>&#x00A9;Yuan Luo, Yiqun Miao, Yuhan Zhao, Jiawei Li, Yuling Chen, Yuexue Yue, Ying Wu. Originally published in JMIR Formative Research (<ext-link ext-link-type="uri" xlink:href="https://formative.jmir.org">https://formative.jmir.org</ext-link>), 2.12.2024. </copyright-statement><copyright-year>2024</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Formative Research, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://formative.jmir.org">https://formative.jmir.org</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://formative.jmir.org/2024/1/e63188"/><abstract><sec><title>Background</title><p>Health-related rumors and misconceptions are spreading at an alarming rate, fueled by the rapid development of the internet and the exponential growth of social media platforms. This phenomenon has become a pressing global concern, as the dissemination of false information can have severe consequences, including widespread panic, social instability, and even public health crises.</p></sec><sec><title>Objective</title><p>The aim of the study is to compare the accuracy of rumor identification and the effectiveness of health science popularization between 2 generated large language models in Chinese (GPT-4 by OpenAI and Enhanced Representation through Knowledge Integration Bot [ERNIE Bot] 4.0 by Baidu).</p></sec><sec sec-type="methods"><title>Methods</title><p>In total, 20 health rumors and misconceptions, along with 10 health truths, were randomly inputted into GPT-4 and ERNIE Bot 4.0. We prompted them to determine whether the statements were rumors or misconceptions and provide explanations for their judgment. Further, we asked them to generate a health science popularization essay. We evaluated the outcomes in terms of accuracy, effectiveness, readability, and applicability. Accuracy was assessed by the rate of correctly identifying health-related rumors, misconceptions, and truths. Effectiveness was determined by the accuracy of the generated explanation, which was assessed collaboratively by 2 research team members with a PhD in nursing. Readability was calculated by the readability formula of Chinese health education materials. Applicability was evaluated by the Chinese Suitability Assessment of Materials.</p></sec><sec sec-type="results"><title>Results</title><p>GPT-4 and ERNIE Bot 4.0 correctly identified all health rumors and misconceptions (100% accuracy rate). For truths, the accuracy rate was 70% (7/10) and 100% (10/10), respectively. Both mostly provided widely recognized viewpoints without obvious errors. The average readability score for the health essays was 2.92 (SD 0.85) for GPT-4 and 3.02 (SD 0.84) for ERNIE Bot 4.0 (<italic>P</italic>=.65). For applicability, except for the content and cultural appropriateness category, significant differences were observed in the total score and scores in other dimensions between them (<italic>P</italic>&#x003C;.05).</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>ERNIE Bot 4.0 demonstrated similar accuracy to GPT-4 in identifying Chinese rumors. Both provided widely accepted views, despite some inaccuracies. These insights enhance understanding and correct misunderstandings. For health essays, educators can learn from readable language styles of GLLMs. Finally, ERNIE Bot 4.0 aligns with Chinese expression habits, making it a good choice for a better Chinese reading experience.</p></sec></abstract><kwd-group><kwd>rumor</kwd><kwd>misconception</kwd><kwd>health science popularization</kwd><kwd>health education</kwd><kwd>large language model</kwd><kwd>LLM</kwd><kwd>applicability</kwd><kwd>accuracy</kwd><kwd>effectiveness</kwd><kwd>health related</kwd><kwd>education</kwd><kwd>health science</kwd><kwd>proof of concept</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>In modern society, rapid information dissemination has given rise to a range of issues, one of which is health-related rumors and misconceptions [<xref ref-type="bibr" rid="ref1">1</xref>]. When people misunderstand health information, these misconceptions are continually propagated, making it easy for rumors to arise [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref3">3</xref>]. These misconceptions can mislead people to make harmful decisions due to a lack of accurate guidance [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref5">5</xref>]. Notably, the general public often lacks scientific knowledge about health information, posing a challenge in distinguishing rumors and misconceptions from truth. Meanwhile, the endogenous health information demand of the public stimulates its dissemination by mass media while providing opportunities for rumor mongers to spread rumors [<xref ref-type="bibr" rid="ref6">6</xref>]. Up to now, official media or institutions have been the main force in debunking rumors and misconceptions. However, relying on official institutions for the refutation has limitations. The lack of medical and health expertise in official media or institutions leads to a slow official response to unexpected public health issues [<xref ref-type="bibr" rid="ref7">7</xref>]. Over time, the delayed response can undermine public trust and confidence [<xref ref-type="bibr" rid="ref8">8</xref>].</p><p>Health workers have the responsibility to undertake health science popularization work, so as to change the public&#x2019;s misconceptions. However, in practical work, the effect of traditional health education patterns is limited. The emergence of generated large language models (GLLMs) has opened up new possibilities for the identification of health-related rumors. In previous studies, GLLMs can be used to create debunking messages against health-related rumors [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>]. In China, Baidu developed the Enhanced Representation through Knowledge Integration Bot (ERNIE Bot) in 2019. Now, GPT-4 (OpenAI) and ERNIE Bot 4.0 represent the most recent advancements, having undergone significant enhancements in their capabilities [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref12">12</xref>]. Previous studies have found that ChatGPT could provide relatively precise health information in the English context [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>]. However, health-related rumors and misconceptions may exhibit different characteristics across different languages and cultural backgrounds, posing higher demands on the generalization capabilities of the models. Mandarin is one of the most widely spoken languages in the world, making it crucial to examine the effectiveness of GLLMs within its linguistic context. Such exploration could potentially lead to improvements in the cultural sensitivity of models, thereby enhancing their utility for a wide range of applications in the Chinese-speaking community. Therefore, we conducted a proof-of-concept study to compare GPT-4 and ERNIE Bot 4.0 within the Chinese context. The aims were to explore the accuracy of identifying health-related rumors or misconceptions by GPT-4 and ERNIE Bot 4.0 and to further evaluate the applicability of health science popularization essays generated by them.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Ethical Considerations</title><p>This study aimed to compare the accuracy of rumor identification and the effectiveness of health science popularization between GPT-4 and ERNIE Bot 4.0, which did not involve the recruitment of human participants. We used health-related rumors, misconceptions, and truths sourced from publicly accessible web-based platforms to test GPT-4 and ERNIE Bot 4.0. The requirement for a formal ethical review was waived. In this study, all researchers, data collectors, and evaluators were aware of the research objectives and conducted the research in accordance with the study design. This study posed no harm to them.</p></sec><sec id="s2-2"><title>Materials and Designs</title><p>The health-related rumors, misconceptions, and truths were selected from the China Internet Disinformation Platform (CIDP). The inclusive materials were issued from January 1 to December 10, 2023. Based on previous proof-of-concept studies, a sample size of 30 is required for feasibility testing [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>]. Considering the primary objective was to investigate the identification capabilities, the ratio of rumors and misconceptions to truths was 2:1. By using a 2:1 ratio, we aimed to ensure that rumors, which are often more prevalent and varied in web-based environments, were adequately represented in our sample. Considering practical constraints such as time and resource limitations, the 2:1 ratio allowed us to manage these constraints while still achieving a representative and meaningful dataset for our research objectives. The rumors and misconceptions were from the &#x201C;Internet Rumor Exposure Station&#x201D; of the CIDP. In total, 20 health-related rumors and misconceptions were randomly selected using the random number table method. The truths were from &#x201C;True Knowledge&#x201D; of the CIDP, an expert-led video platform for debunking rumors. We randomly chose 10 health-related videos. To ensure accuracy, information extraction was completed through discussion by 3 PhD students (YL, YM, and YZ). All samples were randomly inputted into the 2 models in Chinese. Before inputting, the questioning was standardized through group discussion within the research team (YL, YM, and YZ). The questions were conducted in that order. The study process is presented in <xref ref-type="fig" rid="figure1">Figure 1</xref>. All the above work has been completed on December 25&#x2010;26, 2023. All materials and questions are shown in detail in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>The study process. ERNIE Bot: Enhanced Representation through Knowledge Integration Bot.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v8i1e63188_fig01.png"/></fig></sec><sec id="s2-3"><title>Evaluation</title><sec id="s2-3-1"><title>Accuracy</title><p>Accuracy was assessed by the rate of correctly identifying health-related rumors, misconceptions, and truths. The criterion is whether the model accurately classifies information as a rumor, misconception, or truth in its response. Considering the high similarity between rumors and misconceptions in practice, this study did not overly distinguish between them. As long as the response raised doubts and the study group deemed the doubts reasonable upon discussion, it is considered an accurate judgment.</p></sec><sec id="s2-3-2"><title>Effectiveness</title><p>Effectiveness refers to the degree of correctness in explaining the material. The effectiveness of the explanations was critically appraised. Two researchers (YL and YM) collaboratively searched for relevant evidence, such as the latest relevant guidelines, consensus, standards, or high-quality studies. We compared whether the explanations and recommendations provided by the 2 models align with relevant evidence.</p></sec><sec id="s2-3-3"><title>Readability</title><p>Readability refers to the ease with which a reader can understand a written text. Readability was calculated by the formula [<xref ref-type="bibr" rid="ref17">17</xref>]: <italic>R</italic> = 17.5255 + 0.0024<italic>X</italic><sub>1</sub> + 0.04415<italic>X</italic><sub>2</sub> &#x2212; 18.3344 (1 &#x2212; <italic>X</italic><sub>3</sub>), where <italic>R</italic> represents the readability level of the health information. The smaller <italic>R</italic> value indicates that the health essay is easier to read, and the range of <italic>R</italic> value represents reading grade level. For example, 2&#x2264;<italic>R</italic>&#x003C;3 represents the material that was suitable for grades 2-3. <italic>X</italic><sub>1</sub> represents the total number of words in the material, excluding punctuation. <italic>X</italic><sub>2</sub> represents average sentence length, which is the ratio of total word number to complete sentence number (a complete sentence is a sentence that ends with a period, question mark, or exclamation point). <italic>X</italic><sub>3</sub> represents the percentage of medical-related terminologies, calculated as the total number of terminology words divided by the total number of words. The inclusive criteria for medical terminology is the Chinese Medical Subject Headings [<xref ref-type="bibr" rid="ref18">18</xref>]. The subject headings and subheadings were considered as the medical terminology. Meantime, Chinese Medical Subject Headings is not updated simultaneously, so we further check out the SinoMed and PubMed MeSH Database as the complementary medical terminologies. Additionally, we considered the real-world use of some words commonly understood in daily life, such as &#x201C;sleep,&#x201D; &#x201C;health,&#x201D; &#x201C;disease,&#x201D; &#x201C;death,&#x201D; &#x201C;nutrition,&#x201D; &#x201C;medicine,&#x201D; &#x201C;vitamin,&#x201D; and &#x201C;infection,&#x201D; and some common diseases including &#x201C;hypertension,&#x201D; &#x201C;diabetes,&#x201D; and &#x201C;hyperlipidemia.&#x201D; Because the readability formula was suitable for persons with primary education [<xref ref-type="bibr" rid="ref17">17</xref>], the above words were considered as everyday words. All medical terminologies in doubt were resolved through group discussion.</p></sec><sec id="s2-3-4"><title>Applicability</title><p>Applicability refers to the suitability and feasibility of using the material for health science popularization. Applicability was evaluated by the Chinese Suitability Assessment of Materials (CSAM). The interrater reliability of the tool was 0.85, indicating high consistency among raters. Additionally, based on item response theory and generalizability theory, the tool demonstrated good structural validity and discriminant validity [<xref ref-type="bibr" rid="ref19">19</xref>]. Six dimensions were assessed: content, literacy demand, graphics, layout or typography, learning simulation, and cultural appropriateness. In total, the 22 items were scored on a 3-grade rating from 0 to 2. A total score was from 0 to 44, which showed the better suitability in a higher score, and a percentage (actual to total score) is determined with the results interpreted as follows: 70%-100% as very applicable (grade 1), 40%-69% as applicable (grade 2), and 0%-39% as not applicable (grade 3) [<xref ref-type="bibr" rid="ref20">20</xref>-<xref ref-type="bibr" rid="ref22">22</xref>]. In this study, the 2 GLLMs could provide text-only health material without graphics. Finally, 17 items in 5 dimensions were used to evaluate the material except the graphics part, with a total score of 34.</p><p>One researcher (YL) randomly sequenced the health essays. Two raters (YZ and JL) engaged in discussions to determine the final evaluation results. They were uncertain which GLLM had generated which health essay.</p></sec></sec><sec id="s2-4"><title>Analysis</title><p>SPSS (version 26.0; IBM Corp) was adopted to establish the cross-checking database by 2 reviewers (YL and YM) independently. Continuous data were expressed as mean and SD, and categorical data were expressed as frequency or percentage. According to the P-P plot test, the readability and applicability scores showed an approximately normal distribution. A 2-tailed <italic>t</italic> test was adopted to compare the differences in readability scores and applicability scores between the 2 models, and a chi-square test was used to compare the applicability grade. Further, a rank-sum test was selected to compare grade distribution differences among all items of the CSAM between the 2 models. Meanwhile, textual data (health essays) were qualitatively analyzed to further illustrate the differences between items. In addition, we selected the inductive content analysis [<xref ref-type="bibr" rid="ref23">23</xref>] to summarize the characteristics of the health essays.</p><p>According to related studies of the 2 GLLMs, asking questions in Chinese and English or repeating the same question twice may yield different answers [<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref25">25</xref>]. We further made postanalysis validation to analyze the stability of the 2 GLLMs. If the first response of GPT-4 is inaccurate, we will rephrase the question in English and ask again. Meanwhile, we repeated the same questions for both models to evaluate reproducibility. According to the related studies [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref27">27</xref>], depending on the size of the dataset, 10%&#x2010;25% of data units would be typical. Although there is little consensus regarding the proportion of the data, we selected 25% of cases (5 rumors, n=20 and 3 truths, n=10).</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Accuracy</title><p>For GPT-4, the accuracy rates were 100% (20/20) for identifying rumors or misconceptions and 70% (7/10) for truths. Meanwhile, ERNIE Bot 4.0 achieved 100% accuracy rates for both rumors or misconceptions (20/20) and truths (10/10).</p><p>Among the cases not correctly identified, GPT-4 demonstrates hallucinations, revealed as inconsistencies between explanations and judgments [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>]. For another example, &#x201C;Drinking milk regularly can still lead to Vitamin D deficiency&#x201D; is a truth. The outputs of GPT-4 demonstrated that drinking milk alone might not be enough to meet the body&#x2019;s needs, but it thought this information was a rumor. Similarly, inaccuracies occurred in the identification of other truths.</p></sec><sec id="s3-2"><title>Effectiveness</title><p>Among the explanations, GPT-4 and ERNIE Bot 4.0 mostly provided widely recognized viewpoints. It is worth noting that the 2 models may provide criteria or indicators of health. For example, GPT-4 recommends an average daily water intake of about 2&#x2010;3 L for adults without any additional restrictions. ERNIE Bot 4.0 suggests that in mild climates, persons with light levels of physical activity need to drink 1500-1700 mL of plain water per day. In high temperatures or high levels of physical activity, a moderate increase in water intake is required. In addition, drinking water should be evenly distributed throughout the day to avoid excessive drinking at one time. Furthermore, it also stated that these recommendations come from the Chinese Dietary Guidelines, while the GPT-4 did not provide reference information. We further verified that the citation by ERNIE Bot 4.0 followed the recommendations of the guideline [<xref ref-type="bibr" rid="ref30">30</xref>]. In response to more specific questions, some suggestions were vague and unclear. For the explanation of &#x201C;Diabetic patients can eat fruit,&#x201D; GPT-4 only provided a general principle&#x2014;controlling blood sugar levels&#x2014;while ERNIE Bot 4.0 provided more specific requirements&#x2014;smooth control of postprandial blood glucose within 10 mmol/L&#x2014;which is in compliance with guidelines [<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref32">32</xref>].</p></sec><sec id="s3-3"><title>Readability</title><p>The readability scores of 30 health essays are presented in <xref ref-type="table" rid="table1">Table 1</xref>. The average <italic>R</italic> value for the health essays was 2.92 (SD 0.85) in GPT-4 and 3.02 (SD 0.84) in ERNIE Bot 4.0. There was no statistically significant difference between the 2 models (<italic>P</italic>=.65). For the total number of words, ERNIE Bot 4.0 produced longer essays than GPT-4 (<italic>P</italic>=.03). For the average sentence length, ERNIE Bot 4.0&#x2019;s sentences were shorter than GPT-4&#x2019;s (<italic>P</italic>&#x003C;.01). For comparisons of rumors or misconceptions and truths, respectively, please see Tables S1 and S2 in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>The readability scores of health essays generated by 2 generated large language models (n=30).</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Number<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup></td><td align="left" valign="bottom" colspan="2"><italic>X</italic><sub>1</sub><sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup></td><td align="left" valign="bottom" colspan="2"><italic>X</italic><sub>2</sub><sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup></td><td align="left" valign="bottom" colspan="2"><italic>X</italic><sub>3</sub><sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td><td align="left" valign="bottom" colspan="2"><italic>R</italic><sup><xref ref-type="table-fn" rid="table1fn5">e</xref></sup></td></tr><tr><td align="left" valign="top"/><td align="left" valign="bottom">Bot 1<sup><xref ref-type="table-fn" rid="table1fn6">f</xref></sup></td><td align="left" valign="bottom">Bot 2<sup><xref ref-type="table-fn" rid="table1fn7">g</xref></sup></td><td align="left" valign="bottom">Bot 1</td><td align="left" valign="bottom">Bot 2</td><td align="left" valign="bottom">Bot 1</td><td align="left" valign="bottom">Bot 2</td><td align="left" valign="bottom">Bot 1</td><td align="left" valign="bottom">Bot 2</td></tr></thead><tbody><tr><td align="left" valign="top">1</td><td align="left" valign="top">550</td><td align="left" valign="top">531</td><td align="left" valign="top">30.56</td><td align="left" valign="top">31.24</td><td align="left" valign="top">0.06</td><td align="left" valign="top">0.07</td><td align="left" valign="top">2.96</td><td align="left" valign="top">3.19</td></tr><tr><td align="left" valign="top">2</td><td align="left" valign="top">461</td><td align="left" valign="top">497</td><td align="left" valign="top">28.81</td><td align="left" valign="top">26.16</td><td align="left" valign="top">0.09</td><td align="left" valign="top">0.05</td><td align="left" valign="top">3.12</td><td align="left" valign="top">2.39</td></tr><tr><td align="left" valign="top">3</td><td align="left" valign="top">500</td><td align="left" valign="top">445</td><td align="left" valign="top">31.25</td><td align="left" valign="top">26.18</td><td align="left" valign="top">0.05</td><td align="left" valign="top">0.08</td><td align="left" valign="top">2.65</td><td align="left" valign="top">2.90</td></tr><tr><td align="left" valign="top">4</td><td align="left" valign="top">566</td><td align="left" valign="top">574</td><td align="left" valign="top">33.29</td><td align="left" valign="top">26.09</td><td align="left" valign="top">0.07</td><td align="left" valign="top">0.07</td><td align="left" valign="top">3.25</td><td align="left" valign="top">3.03</td></tr><tr><td align="left" valign="top">5</td><td align="left" valign="top">544</td><td align="left" valign="top">501</td><td align="left" valign="top">28.63</td><td align="left" valign="top">26.37</td><td align="left" valign="top">0.03</td><td align="left" valign="top">0.02</td><td align="left" valign="top">2.34</td><td align="left" valign="top">1.89</td></tr><tr><td align="left" valign="top">6</td><td align="left" valign="top">542</td><td align="left" valign="top">619</td><td align="left" valign="top">36.13</td><td align="left" valign="top">32.58</td><td align="left" valign="top">0.02</td><td align="left" valign="top">0.06</td><td align="left" valign="top">2.36</td><td align="left" valign="top">3.12</td></tr><tr><td align="left" valign="top">7</td><td align="left" valign="top">565</td><td align="left" valign="top">552</td><td align="left" valign="top">33.24</td><td align="left" valign="top">30.67</td><td align="left" valign="top">0.10</td><td align="left" valign="top">0.06</td><td align="left" valign="top">3.80</td><td align="left" valign="top">3.03</td></tr><tr><td align="left" valign="top">8</td><td align="left" valign="top">557</td><td align="left" valign="top">457</td><td align="left" valign="top">30.94</td><td align="left" valign="top">20.77</td><td align="left" valign="top">0.07</td><td align="left" valign="top">0.05</td><td align="left" valign="top">3.15</td><td align="left" valign="top">2.13</td></tr><tr><td align="left" valign="top">9</td><td align="left" valign="top">453</td><td align="left" valign="top">690</td><td align="left" valign="top">25.17</td><td align="left" valign="top">32.86</td><td align="left" valign="top">0.09</td><td align="left" valign="top">0.10</td><td align="left" valign="top">3.07</td><td align="left" valign="top">4.13</td></tr><tr><td align="left" valign="top">10</td><td align="left" valign="top">570</td><td align="left" valign="top">696</td><td align="left" valign="top">31.67</td><td align="left" valign="top">32.26</td><td align="left" valign="top">0.13</td><td align="left" valign="top">0.11</td><td align="left" valign="top">4.28</td><td align="left" valign="top">4.24</td></tr><tr><td align="left" valign="top">11</td><td align="left" valign="top">490</td><td align="left" valign="top">439</td><td align="left" valign="top">37.70</td><td align="left" valign="top">32.87</td><td align="left" valign="top">0.06</td><td align="left" valign="top">0.08</td><td align="left" valign="top">3.12</td><td align="left" valign="top">3.24</td></tr><tr><td align="left" valign="top">12</td><td align="left" valign="top">488</td><td align="left" valign="top">423</td><td align="left" valign="top">28.71</td><td align="left" valign="top">24.88</td><td align="left" valign="top">0.05</td><td align="left" valign="top">0.09</td><td align="left" valign="top">2.61</td><td align="left" valign="top">2.87</td></tr><tr><td align="left" valign="top">13</td><td align="left" valign="top">454</td><td align="left" valign="top">588</td><td align="left" valign="top">26.71</td><td align="left" valign="top">29.40</td><td align="left" valign="top">0.06</td><td align="left" valign="top">0.10</td><td align="left" valign="top">2.51</td><td align="left" valign="top">3.68</td></tr><tr><td align="left" valign="top">14</td><td align="left" valign="top">480</td><td align="left" valign="top">502</td><td align="left" valign="top">26.67</td><td align="left" valign="top">27.89</td><td align="left" valign="top">0.17</td><td align="left" valign="top">0.14</td><td align="left" valign="top">4.54</td><td align="left" valign="top">4.26</td></tr><tr><td align="left" valign="top">15</td><td align="left" valign="top">419</td><td align="left" valign="top">535</td><td align="left" valign="top">29.93</td><td align="left" valign="top">28.16</td><td align="left" valign="top">0.07</td><td align="left" valign="top">0.11</td><td align="left" valign="top">2.79</td><td align="left" valign="top">3.64</td></tr><tr><td align="left" valign="top">16</td><td align="left" valign="top">526</td><td align="left" valign="top">554</td><td align="left" valign="top">35.07</td><td align="left" valign="top">26.38</td><td align="left" valign="top">0.15</td><td align="left" valign="top">0.16</td><td align="left" valign="top">4.83</td><td align="left" valign="top">4.56</td></tr><tr><td align="left" valign="top">17</td><td align="left" valign="top">434</td><td align="left" valign="top">490</td><td align="left" valign="top">36.17</td><td align="left" valign="top">27.22</td><td align="left" valign="top">0.03</td><td align="left" valign="top">0.04</td><td align="left" valign="top">2.29</td><td align="left" valign="top">2.24</td></tr><tr><td align="left" valign="top">18</td><td align="left" valign="top">465</td><td align="left" valign="top">530</td><td align="left" valign="top">33.21</td><td align="left" valign="top">24.09</td><td align="left" valign="top">0.03</td><td align="left" valign="top">0.06</td><td align="left" valign="top">2.37</td><td align="left" valign="top">2.67</td></tr><tr><td align="left" valign="top">19</td><td align="left" valign="top">494</td><td align="left" valign="top">460</td><td align="left" valign="top">30.88</td><td align="left" valign="top">27.06</td><td align="left" valign="top">0.03</td><td align="left" valign="top">0.07</td><td align="left" valign="top">2.33</td><td align="left" valign="top">2.80</td></tr><tr><td align="left" valign="top">20</td><td align="left" valign="top">512</td><td align="left" valign="top">504</td><td align="left" valign="top">34.13</td><td align="left" valign="top">29.65</td><td align="left" valign="top">0.16</td><td align="left" valign="top">0.19</td><td align="left" valign="top">4.86</td><td align="left" valign="top">5.20</td></tr><tr><td align="left" valign="top">21</td><td align="left" valign="top">479</td><td align="left" valign="top">478</td><td align="left" valign="top">26.61</td><td align="left" valign="top">28.12</td><td align="left" valign="top">0.03</td><td align="left" valign="top">0.05</td><td align="left" valign="top">2.05</td><td align="left" valign="top">2.54</td></tr><tr><td align="left" valign="top">22</td><td align="left" valign="top">520</td><td align="left" valign="top">677</td><td align="left" valign="top">30.59</td><td align="left" valign="top">30.77</td><td align="left" valign="top">0.00</td><td align="left" valign="top">0.02</td><td align="left" valign="top">1.79</td><td align="left" valign="top">2.45</td></tr><tr><td align="left" valign="top">23</td><td align="left" valign="top">641</td><td align="left" valign="top">534</td><td align="left" valign="top">30.52</td><td align="left" valign="top">23.22</td><td align="left" valign="top">0.01</td><td align="left" valign="top">0.07</td><td align="left" valign="top">2.19</td><td align="left" valign="top">2.80</td></tr><tr><td align="left" valign="top">24</td><td align="left" valign="top">496</td><td align="left" valign="top">415</td><td align="left" valign="top">33.07</td><td align="left" valign="top">24.41</td><td align="left" valign="top">0.01</td><td align="left" valign="top">0.02</td><td align="left" valign="top">1.99</td><td align="left" valign="top">1.58</td></tr><tr><td align="left" valign="top">25</td><td align="left" valign="top">433</td><td align="left" valign="top">804</td><td align="left" valign="top">28.87</td><td align="left" valign="top">27.72</td><td align="left" valign="top">0.07</td><td align="left" valign="top">0.02</td><td align="left" valign="top">2.82</td><td align="left" valign="top">2.73</td></tr><tr><td align="left" valign="top">26</td><td align="left" valign="top">405</td><td align="left" valign="top">632</td><td align="left" valign="top">27.00</td><td align="left" valign="top">31.60</td><td align="left" valign="top">0.10</td><td align="left" valign="top">0.06</td><td align="left" valign="top">3.12</td><td align="left" valign="top">3.23</td></tr><tr><td align="left" valign="top">27</td><td align="left" valign="top">487</td><td align="left" valign="top">752</td><td align="left" valign="top">30.44</td><td align="left" valign="top">30.08</td><td align="left" valign="top">0.01</td><td align="left" valign="top">0.00</td><td align="left" valign="top">1.78</td><td align="left" valign="top">2.32</td></tr><tr><td align="left" valign="top">28</td><td align="left" valign="top">495</td><td align="left" valign="top">384</td><td align="left" valign="top">30.94</td><td align="left" valign="top">20.21</td><td align="left" valign="top">0.03</td><td align="left" valign="top">0.07</td><td align="left" valign="top">2.34</td><td align="left" valign="top">2.25</td></tr><tr><td align="left" valign="top">29</td><td align="left" valign="top">536</td><td align="left" valign="top">569</td><td align="left" valign="top">35.73</td><td align="left" valign="top">28.45</td><td align="left" valign="top">0.02</td><td align="left" valign="top">0.01</td><td align="left" valign="top">2.40</td><td align="left" valign="top">2.01</td></tr><tr><td align="left" valign="top">30</td><td align="left" valign="top">528</td><td align="left" valign="top">688</td><td align="left" valign="top">33.00</td><td align="left" valign="top">29.91</td><td align="left" valign="top">0.11</td><td align="left" valign="top">0.07</td><td align="left" valign="top">3.83</td><td align="left" valign="top">3.44</td></tr><tr><td align="left" valign="top">Average (SD)</td><td align="left" valign="top">503.00 (52.09)</td><td align="left" valign="top">550.66 (104.54)</td><td align="left" valign="top">31.19 (3.21)</td><td align="left" valign="top">27.91 (3.36)</td><td align="left" valign="top">0.06 (0.05)</td><td align="left" valign="top">0.07 (0.04)</td><td align="left" valign="top">2.92 (0.85)</td><td align="left" valign="top">3.02 (0.84)</td></tr><tr><td align="left" valign="top"><italic>t</italic> test (<italic>df</italic>=29)</td><td align="left" valign="top">2.235</td><td align="left" valign="top">2.235</td><td align="left" valign="top">&#x2212;3.864</td><td align="left" valign="top">&#x2212;3.864</td><td align="left" valign="top">0.618</td><td align="left" valign="top">0.618</td><td align="left" valign="top">0.460</td><td align="left" valign="top">0.460</td></tr><tr><td align="left" valign="top"><italic>P</italic> value</td><td align="left" valign="top">.03</td><td align="left" valign="top">.03</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">.47</td><td align="left" valign="top">.47</td><td align="left" valign="top">.65</td><td align="left" valign="top">.65</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>Numbers 1-20: health science popularization essays based on rumors. Numbers 21-30: health science popularization essays based on truths.</p></fn><fn id="table1fn2"><p><sup>b</sup><italic>X</italic><sub>1</sub>: total number of words.</p></fn><fn id="table1fn3"><p><sup>c</sup><italic>X</italic><sub>2</sub>: average sentence length.</p></fn><fn id="table1fn4"><p><sup>d</sup><italic>X</italic><sub>3</sub>: percentage of medical-related terminologies.</p></fn><fn id="table1fn5"><p><sup>e</sup><italic>R</italic>: readability score.</p></fn><fn id="table1fn6"><p><sup>f</sup>Bot 1: GPT-4.</p></fn><fn id="table1fn7"><p><sup>g</sup>Bot 2: Enhanced Representation through Knowledge Integration Bot 4.0.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-4"><title>Applicability</title><p>The CSAM scores of 30 health essays are presented in <xref ref-type="table" rid="table2">Table 2</xref>, and the grade is presented in <xref ref-type="table" rid="table3">Table 3</xref>. Except for the content and cultural appropriateness, significant differences were observed in the total score and scores in other dimensions between the 2 GLLMs (<italic>P</italic>&#x003C;.05). Generally, the scores of ERNIE Bot 4.0 were higher than those of GPT-4 except for layout or typography. Among the CSAM grades, significant differences were only found in the learning stimulation dimension (<italic>P</italic>=.003). The item score grade distribution is presented in <xref ref-type="table" rid="table4">Table 4</xref> and <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>. Significant grade distribution differences were observed in items b3, b5, d3, and e2 (<italic>P</italic>&#x003C;.05).</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>The CSAM<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup> score of health essays generated by 2 GLLMs<sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup> (n=30).</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Dimension</td><td align="left" valign="bottom" colspan="2">Score</td><td align="left" valign="bottom"><italic>t</italic> test (<italic>df=</italic>29)</td><td align="left" valign="bottom"><italic>P</italic> value</td></tr><tr><td align="left" valign="top"/><td align="left" valign="bottom">Bot 1<sup><xref ref-type="table-fn" rid="table2fn3">c</xref></sup>, mean (SD)</td><td align="left" valign="bottom">Bot 2<sup><xref ref-type="table-fn" rid="table2fn4">d</xref></sup>, mean (SD)</td><td align="left" valign="top"/><td align="left" valign="top"/></tr></thead><tbody><tr><td align="left" valign="top">Content</td><td align="left" valign="top">7.47 (0.50)</td><td align="left" valign="top">7.70 (0.47)</td><td align="left" valign="top">&#x2212;1.855</td><td align="left" valign="top">.07</td></tr><tr><td align="left" valign="top">Literacy demand</td><td align="left" valign="top">7.87 (1.04)</td><td align="left" valign="top">8.57 (0.68)</td><td align="left" valign="top">&#x2212;3.084</td><td align="left" valign="top">.003</td></tr><tr><td align="left" valign="top">Layout or typography</td><td align="left" valign="top">3.53 (0.82)</td><td align="left" valign="top">2.97 (0.93)</td><td align="left" valign="top">2.507</td><td align="left" valign="top">.02</td></tr><tr><td align="left" valign="top">Learning stimulation</td><td align="left" valign="top">3.63 (1.03)</td><td align="left" valign="top">4.33 (0.71)</td><td align="left" valign="top">&#x2212;3.056</td><td align="left" valign="top">.003</td></tr><tr><td align="left" valign="top">Cultural appropriateness</td><td align="left" valign="top">3.40 (0.56)</td><td align="left" valign="top">3.57 (0.50)</td><td align="left" valign="top">&#x2212;1.208</td><td align="left" valign="top">.23</td></tr><tr><td align="left" valign="top">Total</td><td align="left" valign="top">25.90 (2.29)</td><td align="left" valign="top">27.13 (1.94)</td><td align="left" valign="top">&#x2212;2.247</td><td align="left" valign="top">.03</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>CSAM: Chinese Suitability Assessment of Materials.</p></fn><fn id="table2fn2"><p><sup>b</sup>GLLM: generated large language model.</p></fn><fn id="table2fn3"><p><sup>c</sup>Bot 1: GPT-4.</p></fn><fn id="table2fn4"><p><sup>d</sup>Bot 2: Enhanced Representation through Knowledge Integration Bot 4.0.</p></fn></table-wrap-foot></table-wrap><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>The CSAM<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup> grade of health essays generated by 2 GLLMs<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup> (n=30)<sup><xref ref-type="table-fn" rid="table3fn3">c</xref></sup>.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Dimension</td><td align="left" valign="bottom" colspan="3">Bot 1<sup><xref ref-type="table-fn" rid="table3fn4">d</xref></sup></td><td align="left" valign="bottom" colspan="3">Bot 2<sup><xref ref-type="table-fn" rid="table3fn5">e</xref></sup></td></tr><tr><td align="left" valign="bottom"/><td align="left" valign="bottom">Grade 1</td><td align="left" valign="bottom">Grade 2</td><td align="left" valign="bottom">Grade 3</td><td align="left" valign="bottom">Grade 1</td><td align="left" valign="bottom">Grade 2</td><td align="left" valign="bottom">Grade 3</td></tr></thead><tbody><tr><td align="left" valign="top">Content<sup><xref ref-type="table-fn" rid="table3fn6">f</xref></sup></td><td align="left" valign="top">30</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td><td align="left" valign="top">30</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td></tr><tr><td align="left" valign="top">Literacy demand<sup><xref ref-type="table-fn" rid="table3fn6">f</xref></sup></td><td align="left" valign="top">26</td><td align="left" valign="top">4</td><td align="left" valign="top">0</td><td align="left" valign="top">30</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td></tr><tr><td align="left" valign="top">Layout or typography<sup><xref ref-type="table-fn" rid="table3fn7">g</xref></sup></td><td align="left" valign="top">0</td><td align="left" valign="top">24</td><td align="left" valign="top">6</td><td align="left" valign="top">0</td><td align="left" valign="top">17</td><td align="left" valign="top">13</td></tr><tr><td align="left" valign="top">Learning stimulation<sup><xref ref-type="table-fn" rid="table3fn6">f</xref></sup><sup>,</sup><sup><xref ref-type="table-fn" rid="table3fn8">h</xref></sup></td><td align="left" valign="top">6</td><td align="left" valign="top">20</td><td align="left" valign="top">4</td><td align="left" valign="top">14</td><td align="left" valign="top">16</td><td align="left" valign="top">0</td></tr><tr><td align="left" valign="top">Cultural appropriateness<sup><xref ref-type="table-fn" rid="table3fn6">f</xref></sup></td><td align="left" valign="top">29</td><td align="left" valign="top">1</td><td align="left" valign="top">0</td><td align="left" valign="top">30</td><td align="left" valign="top">0</td><td align="left" valign="top">0</td></tr><tr><td align="left" valign="top">Total<sup><xref ref-type="table-fn" rid="table3fn6">f</xref></sup></td><td align="left" valign="top">26</td><td align="left" valign="top">4</td><td align="left" valign="top">0</td><td align="left" valign="top">29</td><td align="left" valign="top">1</td><td align="left" valign="top">0</td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup>CSAM: Chinese Suitability Assessment of Materials.</p></fn><fn id="table3fn2"><p><sup>b</sup>GLLM: generated large language model.</p></fn><fn id="table3fn3"><p><sup>c</sup>The percentage (actual to total score) is determined with the results interpreted as follows: 70%-100% as very applicable (grade 1), 40%-69% as applicable (grade 2), and 0%-39% as not applicable (grade 3).</p></fn><fn id="table3fn4"><p><sup>d</sup>Bot 1: GPT-4.</p></fn><fn id="table3fn5"><p><sup>e</sup>Bot 2: Enhanced Representation through Knowledge Integration Bot 4.0.</p></fn><fn id="table3fn6"><p><sup>f</sup>Fisher exact text.</p></fn><fn id="table3fn7"><p><sup>g</sup>Chi-square text</p></fn><fn id="table3fn8"><p><sup>h</sup><italic>P</italic>&#x003C;.05.</p></fn></table-wrap-foot></table-wrap><table-wrap id="t4" position="float"><label>Table 4.</label><caption><p>The CSAM<sup><xref ref-type="table-fn" rid="table4fn1">a</xref></sup> item score of health essays generated by 2 GLLMs<sup><xref ref-type="table-fn" rid="table4fn2">b</xref></sup> (n=30)<sup><xref ref-type="table-fn" rid="table4fn3">c</xref></sup>.</p></caption><table id="table4" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Item</td><td align="left" valign="bottom">Bot 1<sup><xref ref-type="table-fn" rid="table4fn4">d</xref></sup>, mean rank</td><td align="left" valign="bottom">Bot 2<sup><xref ref-type="table-fn" rid="table4fn5">e</xref></sup>, mean rank</td><td align="left" valign="bottom"><italic>Z</italic> value</td><td align="left" valign="bottom"><italic>P</italic> value</td></tr></thead><tbody><tr><td align="left" valign="top">a1<sup><xref ref-type="table-fn" rid="table4fn6">f</xref></sup></td><td align="left" valign="top">30.50</td><td align="left" valign="top">30.50</td><td align="left" valign="top">&#x003C;0.001</td><td align="left" valign="top">&#x003E;.99</td></tr><tr><td align="left" valign="top">a2<sup><xref ref-type="table-fn" rid="table4fn7">g</xref></sup></td><td align="left" valign="top">27.00</td><td align="left" valign="top">34.00</td><td align="left" valign="top">&#x2212;1.818</td><td align="left" valign="top">.07</td></tr><tr><td align="left" valign="top">a3<sup><xref ref-type="table-fn" rid="table4fn8">h</xref></sup></td><td align="left" valign="top">30.50</td><td align="left" valign="top">30.50</td><td align="left" valign="top">&#x003C;0.001</td><td align="left" valign="top">&#x003E;.99</td></tr><tr><td align="left" valign="top">a4<sup><xref ref-type="table-fn" rid="table4fn9">i</xref></sup></td><td align="left" valign="top">30.50</td><td align="left" valign="top">30.50</td><td align="left" valign="top">&#x003C;0.001</td><td align="left" valign="top">&#x003E;.99</td></tr><tr><td align="left" valign="top">b1<sup><xref ref-type="table-fn" rid="table4fn10">j</xref></sup></td><td align="left" valign="top">31.00</td><td align="left" valign="top">30.00</td><td align="left" valign="top">&#x2212;1.000</td><td align="left" valign="top">.32</td></tr><tr><td align="left" valign="top">b2<sup><xref ref-type="table-fn" rid="table4fn11">k</xref></sup></td><td align="left" valign="top">30.50</td><td align="left" valign="top">30.50</td><td align="left" valign="top">&#x003C;0.001</td><td align="left" valign="top">&#x003E;.99</td></tr><tr><td align="left" valign="top">b3<sup><xref ref-type="table-fn" rid="table4fn12">l</xref></sup></td><td align="left" valign="top">27.00</td><td align="left" valign="top">34.00</td><td align="left" valign="top">&#x2212;2.316</td><td align="left" valign="top">.02</td></tr><tr><td align="left" valign="top">b4<sup><xref ref-type="table-fn" rid="table4fn13">m</xref></sup></td><td align="left" valign="top">28.00</td><td align="left" valign="top">33.00</td><td align="left" valign="top">&#x2212;1.376</td><td align="left" valign="top">.17</td></tr><tr><td align="left" valign="top">b5<sup><xref ref-type="table-fn" rid="table4fn14">n</xref></sup></td><td align="left" valign="top">26.85</td><td align="left" valign="top">34.15</td><td align="left" valign="top">&#x2212;2.256</td><td align="left" valign="top">.02</td></tr><tr><td align="left" valign="top">d1<sup><xref ref-type="table-fn" rid="table4fn15">o</xref></sup></td><td align="left" valign="top">30.50</td><td align="left" valign="top">30.50</td><td align="left" valign="top">&#x003C;0.001</td><td align="left" valign="top">&#x003E;.99</td></tr><tr><td align="left" valign="top">d2<sup><xref ref-type="table-fn" rid="table4fn16">p</xref></sup></td><td align="left" valign="top">30.50</td><td align="left" valign="top">30.50</td><td align="left" valign="top">&#x003C;0.001</td><td align="left" valign="top">&#x003E;.99</td></tr><tr><td align="left" valign="top">d3<sup><xref ref-type="table-fn" rid="table4fn17">q</xref></sup></td><td align="left" valign="top">35.43</td><td align="left" valign="top">25.57</td><td align="left" valign="top">&#x2212;2.470</td><td align="left" valign="top">.01</td></tr><tr><td align="left" valign="top">e1<sup><xref ref-type="table-fn" rid="table4fn18">r</xref></sup></td><td align="left" valign="top">28.00</td><td align="left" valign="top">33.00</td><td align="left" valign="top">&#x2212;1.376</td><td align="left" valign="top">.17</td></tr><tr><td align="left" valign="top">e2<sup><xref ref-type="table-fn" rid="table4fn19">s</xref></sup></td><td align="left" valign="top">25.37</td><td align="left" valign="top">35.63</td><td align="left" valign="top">&#x2212;2.850</td><td align="left" valign="top">.004</td></tr><tr><td align="left" valign="top">e3<sup><xref ref-type="table-fn" rid="table4fn20">t</xref></sup></td><td align="left" valign="top">29.27</td><td align="left" valign="top">31.73</td><td align="left" valign="top">&#x2212;0.682</td><td align="left" valign="top">.496</td></tr><tr><td align="left" valign="top">f1<sup><xref ref-type="table-fn" rid="table4fn21">u</xref></sup></td><td align="left" valign="top">30.50</td><td align="left" valign="top">30.50</td><td align="left" valign="top">&#x003C;0.001</td><td align="left" valign="top">&#x003E;.99</td></tr><tr><td align="left" valign="top">f2<sup><xref ref-type="table-fn" rid="table4fn22">v</xref></sup></td><td align="left" valign="top">28.28</td><td align="left" valign="top">32.72</td><td align="left" valign="top">&#x2212;1.126</td><td align="left" valign="top">.26</td></tr></tbody></table><table-wrap-foot><fn id="table4fn1"><p><sup>a</sup>CSAM: Chinese Suitability Assessment of Materials.</p></fn><fn id="table4fn2"><p><sup>b</sup>GLLM: generated large language model.</p></fn><fn id="table4fn3"><p><sup>c</sup>Mann-Whitney <italic>U</italic> test was used to compare between the 2 GLLMs.</p></fn><fn id="table4fn4"><p><sup>d</sup>Bot 1: GPT-4.</p></fn><fn id="table4fn5"><p><sup>e</sup>Bot 2: Enhanced Representation through Knowledge Integration Bot 4.0.</p></fn><fn id="table4fn6"><p><sup>f</sup>a1: purpose is evident.</p></fn><fn id="table4fn7"><p><sup>g</sup>a2: content about behaviors.</p></fn><fn id="table4fn8"><p><sup>h</sup>a3: scope is limited.</p></fn><fn id="table4fn9"><p><sup>i</sup>a4: summary or review included.</p></fn><fn id="table4fn10"><p><sup>j</sup>b1: reading grade level</p></fn><fn id="table4fn11"><p><sup>k</sup>b2: writing style, active voice</p></fn><fn id="table4fn12"><p><sup>l</sup>b3: context is given first</p></fn><fn id="table4fn13"><p><sup>m</sup>b4: vocabulary.</p></fn><fn id="table4fn14"><p><sup>n</sup>b5: road signs.</p></fn><fn id="table4fn15"><p><sup>o</sup>d1: layout factors.</p></fn><fn id="table4fn16"><p><sup>p</sup>d2: typography.</p></fn><fn id="table4fn17"><p><sup>q</sup>d3: subheadings used.</p></fn><fn id="table4fn18"><p><sup>r</sup>e1: interaction used.</p></fn><fn id="table4fn19"><p><sup>s</sup>e2: behaviors are modeled and specific.</p></fn><fn id="table4fn20"><p><sup>t</sup>e3: motivation.</p></fn><fn id="table4fn21"><p><sup>u</sup>f1: match in logic, language, experience.</p></fn><fn id="table4fn22"><p><sup>v</sup>f2: cultural image and examples.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-5"><title>Characteristics of the Health Essays</title><sec id="s3-5-1"><title>Use of Subheadings</title><p>GPT-4 tends to use subheadings. Among the 30 health essays, GPT-4 incorporated the subheading format in a total of 24 papers, whereas ERNIE Bot 4.0 opted for subheadings in 13 papers. Meanwhile, GPT-4 scored higher on item d3 (subheadings used) of the CSAM, indicating the frequent use of subheadings, without statistical significance (<xref ref-type="table" rid="table4">Table 4</xref> and <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>).</p></sec><sec id="s3-5-2"><title>Interaction Mode</title><p>Two GLLMs prefer to ask and answer themselves and sometimes write lengthy explanatory or illustrative texts that lack subheadings. In health science popularization, it is not only necessary to give readers the correct answers but also to constantly stimulate readers to think [<xref ref-type="bibr" rid="ref33">33</xref>]. Meanwhile, ERNIE Bot 4.0 scored higher than GPT-4 in item e1 (interaction used) of the CSAM without statistical significance (<xref ref-type="table" rid="table4">Table 4</xref> and <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>).</p></sec><sec id="s3-5-3"><title>Linguistic Habits</title><p>The advantage of the 2 GLLMs is their preference for the active voice. In Chinese, active voice typically conforms to linguistic conventions. Comparatively speaking, simple sentences are more commonly used in the responses of ERNIE Bot 4.0, while GPT-4 tends to use compound sentences more often. Therefore, ERNIE Bot 4.0 conforms to Chinese language conventions. Furthermore, GPT-4 generates texts with grammatical problems.</p></sec><sec id="s3-5-4"><title>Content</title><p>First, GPT-4 tends to respond more frequently (13 times) to phrases like &#x201C;the research showed that...&#x201D; or &#x201C;Experts suggest or recommend that...&#x201D; compared to ERNIE Bot 4.0, which used such phrases less often (4 times). Furthermore, neither GPT-4 nor ERNIE Bot 4.0 provided references or citations for these recommendations.</p><p>Second, 2 GLLMs can provide specific cutoff points such as water intake. ERNIE Bot 4.0 stated that these recommendations were from the Chinese Dietary Guidelines, but GPT-4 did not provide the original source. However, it is important to note that even ERNIE Bot 4.0 can sometimes fail to cite its sources adequately. For example, a daily intake of 300 g of cooked white rice may serve as a cutoff point, above which the risk of developing type 2 diabetes increases by 13% with every additional intake of 158 g. While this statement appears comprehensive, the lack of an original source leaves us with no way to verify the conclusion.</p></sec></sec><sec id="s3-6"><title>Postanalysis Validation</title><p>Considering the potential impact of language [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref24">24</xref>], 2 weeks later after the first questioning, we asked GPT-4 in English and received its English response for the truths not correctly identified. However, GPT-4 still responded that &#x201C;Drinking milk regularly can still lead to Vitamin D deficiency&#x201D; was a rumor, despite the English explanations were accurate. For other truths, GPT-4 still replied &#x201C;it is a topic of debate.&#x201D;</p><p>When the same question is submitted twice, it is a possibility that the 2 responses generated may not be similar before and after the second submission [<xref ref-type="bibr" rid="ref25">25</xref>]. Further, we asked the same questions to the 2 models again from January 23 to 24, 2024. Notably, GPT-4 expressed differential opinions in its 2 responses for the same case (&#x201C;Eating more spinach for iron supplements&#x201D;). In the first time, GPT-4 argued that the viewpoint was inaccurate, whereas, in the second time, it considered the view correct. The 2 explanations were consistent, both agreeing that the viewpoint was theoretically feasible but had little effect in practice. Overall, among other cases, there was consistency in the 2 time-point responses with some differences in detail. For instance, about a truth&#x2014;&#x201C;You can drink milk on an empty stomach&#x201D;&#x2014;in comparison with the first response, GPT-4 added an explanation about food culture.</p><p>In the second response, ERNIE Bot 4.0 accurately identified the rumor or misconception, and while the 2 explanations were similar overall, the second one was longer and included more details. For the truth that &#x201C;You can drink milk on an empty stomach,&#x201D; the second response provided additional information, covering special situations like lactose intolerance. When it came to the rumor that &#x201C;Sunlight through glass windows can replenish calcium,&#x201D; the second response not only explained the cause but also offered dietary advice. Interestingly, in debunking the rumor that &#x201C;Drinking more water is healthier,&#x201D; the first response mentioned the recommendation of Chinese Dietary Guidelines, but it disappeared in the second response. This inconsistency might suggest randomness in their responses.</p></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>When comparing GPT-4 and ERNIE Bot 4.0, both performed well in identifying rumors or misconceptions, but GPT-4 demonstrated hallucinations. Notably, both models provided comprehensive explanations. However, they rarely provided supporting citations for their viewpoints. On the CIDP, without proven scientific evidence, it has been recognized as a rumor and could mislead the public. The unconfirmed information is shared on the web as if it were accurate information, sometimes going viral and causing widespread anxiety or leading to misinformation-based beliefs [<xref ref-type="bibr" rid="ref34">34</xref>].</p><p>For recommendations and viewpoints provided by the 2 GLLMs, we further asked them to offer references or citations. Regrettably, the 2 models indicated that they were unable to provide accurate source material, but they sometimes could provide vague references. Upon further verification, we found that the references cited as evidence were either full of mistakes or completely fabricated. This is consistent with previous studies conducted on earlier versions of ChatGPT [<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref36">36</xref>]. Our findings suggest that the same problem still persists on GPT-4 and ERNIE Bot 4.0. Especially, the provided numerical values should be carefully examined. The value may be from nonauthoritative reports [<xref ref-type="bibr" rid="ref25">25</xref>]. Nevertheless, the 2 models usually provide widely recognized viewpoints, and the recommended healthy lifestyles are also aligned with the guidelines. Overall, despite limitations, they can achieve the effectiveness of science popularization for the general public in the situation that there is no health care professional to judge information.</p><p>Readability is a critical factor in comprehension, which refers to how well a passage of text can be read and understood by an individual [<xref ref-type="bibr" rid="ref37">37</xref>]. For low literacy skills, a fifth-grade level or lower is more suitable [<xref ref-type="bibr" rid="ref38">38</xref>]. Obviously, the essays generated by the 2 GLLMs met the requirements in reading level (<xref ref-type="table" rid="table1">Table 1</xref>). In our study, although the readability scores of the 2 GLLMs were not statistically different, ERNIE Bot 4.0 generated longer text than GPT-4 (<xref ref-type="table" rid="table1">Table 1</xref>). For an individual with lower literacy skills, longer text may lead to loss of interest and even cause reading difficulties. The related studies have proved that GLLMs can provide simplified text, but understanding this text still requires a certain level of education [<xref ref-type="bibr" rid="ref39">39</xref>-<xref ref-type="bibr" rid="ref41">41</xref>]. Additionally, reading fluency is an essential aspect of the overall reading experience. The grammatical issues in GPT-4 cannot be overlooked, and GPT-4 tends to generate longer sentences than ERNIE Bot 4.0 (<italic>P</italic>&#x003C;.001; <xref ref-type="table" rid="table1">Table 1</xref>). This suggests that texts by ERNIE Bot 4.0 may be easier to read. Nevertheless, text easiness showed no influence on trustworthiness, and the public may still blindly believe this content [<xref ref-type="bibr" rid="ref42">42</xref>]. Considering the randomness of the responses provided by the 2 models, caution should be made when taking their advice.</p><p>ERNIE Bot 4.0 was better than GPT-4 in item b3 (context is given first; <italic>P</italic>=.02) and b5 (road signs; <italic>P</italic>=.02; <xref ref-type="table" rid="table4">Table 4</xref> and <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>). The context is given before new information. We learn new facts or behaviors more quickly when told the context first. Meanwhile, headers or topic captions tell very briefly what is coming next. These &#x201C;road signs&#x201D; make the text look less intimidating and prepare the reader&#x2019;s thought process to expect the announced topic [<xref ref-type="bibr" rid="ref38">38</xref>]. GPT-4 performed better than ERNIE Bot 4.0 in item d3 (subheadings used; <italic>P</italic>=.01; <xref ref-type="table" rid="table4">Table 4</xref> and <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>). Longer texts need to be partitioned into smaller chunks. Subheadings can help readers quickly understand the core content of each chunk [<xref ref-type="bibr" rid="ref38">38</xref>]. In item e2 (behaviors are modeled and specific), ERNIE Bot 4.0 performed better than GPT-4 (<italic>P</italic>=.004; <xref ref-type="table" rid="table4">Table 4</xref> and <xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>). People often learn more readily when specific, familiar instances are used rather than abstract or general concepts [<xref ref-type="bibr" rid="ref38">38</xref>]. When presented with the health essay &#x201C;There is no standard for the ideal time of sleep,&#x201D; GPT-4 explained more about factors affecting sleep duration. In contrast, ERNIE Bot 4.0 dedicated approximately 50% of its response to helping individuals determine the appropriate length of sleep for themselves.</p><p>One of GLLM&#x2019;s strengths is its ability to sift through massive amounts of information and produce responses in a conversational and easy-to-understand manner. In contrast, search results from current search engines can often be overwhelming for the general public, frequently filled with irrelevant or misleading information [<xref ref-type="bibr" rid="ref25">25</xref>]. However, as ChatGPT and ERNIE Bot are specifically designed for conversational dialogue, their responses can be more comprehensible than those found in professional guidelines or literature. The study showed that, after reading popularized papers addressed to a lay audience, lay readers agreed more with the knowledge claims presented in those papers and were more confident in their claim judgments than after reading papers addressed to expert readers [<xref ref-type="bibr" rid="ref43">43</xref>]. In our study, we found that the 2 GLLMs provided easy-to-understand information. However, the information might be superficial or nonspecific with errors. Therefore, if someone agrees with the idea because of the model&#x2019;s response, the misleading information spreads widely on the web possibly [<xref ref-type="bibr" rid="ref44">44</xref>].</p><p>Another key element for health education is stimulation and motivation. Interaction, in particular, plays a crucial role in health education or popularization. We suggest that a questioning format should be used to keep the reader recalling the educational content. In the health essays provided by the 2 models, a question-and-answer format was used, which involved posing a question and then promptly providing the corresponding answer. Even though it is a passive interaction, it is still more effective in reminding readers to focus on the following answers than long explanatory or illustrative texts. Meanwhile, it is recommended that both models successfully break down complex topics. This not only makes the materials more understandable but also allows the readers to explore the logic of cause and effect. When people believe tasks and behaviors are valuable and practicable, they will be motivated to learn [<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref45">45</xref>].</p><p>This study has some limitations. First, due to time constraints, we were unable to use all the cases in the rumor library. We chose typical recent cases to test their ability as in previous studies. Second, the readability formula is a general tool. In the future, it is worth exploring to develop the specific tool for Chinese medical materials. Third, the CSAM can help you save time and money and improve program effectiveness by selecting or producing materials that the public is likely to pick up, read, understand, and act on. The CSAM cannot substitute for formative research and testing, through which the public confirms that the information is attractive, useful, and persuasive to them. Fourth, the 2 GLLMs do not provide graphics. In many works of scientific popularization, graphic is an important tool to help readers understand. However, with the emergence of GLLMs&#x2019; capability to generate graphics, we need to explore whether this function can assist in science popularization further in depth. Fifth, this study was to compare 2 GLLMs. With more and more GLLMs being developed, future research can further explore the applicability of them in the Chinese context. Finally, this study focuses more on the Chinese context. Future exploration will be to include more linguistics experts to jointly discuss the impact of different languages on large language models.</p></sec><sec id="s4-2"><title>Conclusions</title><p>ERNIE Bot 4.0 demonstrated similar accuracy to GPT-4 in identifying Chinese rumors. Notably, the 2 GLLMs mostly provided widely recognized viewpoints, despite potential inaccuracies and superficiality. When it comes to the health essays, nurses can learn from the linguistic strengths that facilitate readability and comprehension. However, the content needs to be checked by experts for appropriateness and accuracy. Additionally, ERNIE Bot 4.0 aligns well with Chinese expression habits, making it a suitable choice for those seeking an enhanced Chinese reading experience.</p></sec></sec></body><back><ack><p>This research was supported by the Key Program of the National Natural Science Foundation of China (72034005).</p></ack><notes><sec><title>Data Availability</title><p>The datasets generated and analyzed during this study are available from the corresponding author on reasonable request.</p></sec></notes><fn-group><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">CIDP</term><def><p>China Internet Disinformation Platform</p></def></def-item><def-item><term id="abb2">CSAM</term><def><p>Chinese Suitability Assessment of Materials</p></def></def-item><def-item><term id="abb3">ERNIE Bot</term><def><p>Enhanced Representation through Knowledge Integration Bot</p></def></def-item><def-item><term id="abb4">GLLM</term><def><p>generated large language model</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yang</surname><given-names>F</given-names> </name><name name-style="western"><surname>Ren</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>S</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>X</given-names> </name></person-group><article-title>Health-related rumor control through social collaboration models: lessons from cases in China during the COVID-19 pandemic</article-title><source>Healthcare (Basel)</source><year>2022</year><month>08</month><day>5</day><volume>10</volume><issue>8</issue><fpage>1475</fpage><pub-id pub-id-type="doi">10.3390/healthcare10081475</pub-id><pub-id pub-id-type="medline">36011131</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Fazio</surname><given-names>LK</given-names> </name><name name-style="western"><surname>Brashier</surname><given-names>NM</given-names> </name><name name-style="western"><surname>Payne</surname><given-names>BK</given-names> </name><name name-style="western"><surname>Marsh</surname><given-names>EJ</given-names> </name></person-group><article-title>Knowledge does not protect against illusory truth</article-title><source>J Exp Psychol Gen</source><year>2015</year><month>10</month><volume>144</volume><issue>5</issue><fpage>993</fpage><lpage>1002</lpage><pub-id pub-id-type="doi">10.1037/xge0000098</pub-id><pub-id pub-id-type="medline">26301795</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Arora</surname><given-names>N</given-names></name></person-group><person-group person-group-type="editor"><name name-style="western"><surname>Biswas</surname><given-names>A</given-names> </name><name name-style="western"><surname>Patgiri</surname><given-names>R</given-names> </name><name name-style="western"><surname>Biswas</surname><given-names>B</given-names> </name></person-group><article-title>Fake news and rumor detection</article-title><source>Principles of Social Networking: The New Horizon and Emerging Challenges</source><year>2022</year><publisher-name>Springer Singapore</publisher-name><fpage>307</fpage><lpage>324</lpage><pub-id pub-id-type="doi">10.1007/978-981-16-3398-0_14</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhuang</surname><given-names>W</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>J</given-names> </name><name name-style="western"><surname>Wei</surname><given-names>P</given-names> </name><etal/></person-group><article-title>Misconception contributed to COVID-19 vaccine hesitancy in patients with lung cancer or ground-glass opacity: a cross-sectional study of 324 Chinese patients</article-title><source>Hum Vaccin Immunother</source><year>2021</year><month>12</month><day>2</day><volume>17</volume><issue>12</issue><fpage>5016</fpage><lpage>5023</lpage><pub-id pub-id-type="doi">10.1080/21645515.2021.1992212</pub-id><pub-id pub-id-type="medline">34715002</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bakebillah</surname><given-names>M</given-names> </name><name name-style="western"><surname>Billah</surname><given-names>MA</given-names> </name><name name-style="western"><surname>Wubishet</surname><given-names>BL</given-names> </name><name name-style="western"><surname>Khan</surname><given-names>MN</given-names> </name></person-group><article-title>Community&#x2019;s misconception about COVID-19 and its associated factors in Satkhira, Bangladesh: a cross-sectional study</article-title><source>PLoS One</source><year>2021</year><volume>16</volume><issue>9</issue><fpage>e0257410</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0257410</pub-id><pub-id pub-id-type="medline">34506614</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>X</given-names> </name><name name-style="western"><surname>Li</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Li</surname><given-names>J</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Qiu</surname><given-names>C</given-names> </name></person-group><article-title>A rumor reversal model of online health information during the Covid-19 epidemic</article-title><source>Inf Process Manag</source><year>2021</year><month>11</month><volume>58</volume><issue>6</issue><fpage>102731</fpage><pub-id pub-id-type="doi">10.1016/j.ipm.2021.102731</pub-id><pub-id pub-id-type="medline">34539040</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zou</surname><given-names>W</given-names> </name><name name-style="western"><surname>Tang</surname><given-names>L</given-names> </name></person-group><article-title>What do we believe in? Rumors and processing strategies during the COVID-19 outbreak in China</article-title><source>Public Underst Sci</source><year>2021</year><month>02</month><volume>30</volume><issue>2</issue><fpage>153</fpage><lpage>168</lpage><pub-id pub-id-type="doi">10.1177/0963662520979459</pub-id><pub-id pub-id-type="medline">33353491</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tan</surname><given-names>EY</given-names> </name><name name-style="western"><surname>Albarazi</surname><given-names>D</given-names> </name><name name-style="western"><surname>Saw</surname><given-names>YE</given-names> </name><name name-style="western"><surname>Buvanaswari</surname><given-names>P</given-names> </name><name name-style="western"><surname>Doshi</surname><given-names>K</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>JC</given-names> </name></person-group><article-title>Confidence in government and rumors amongst migrant worker men involved in dormitory outbreaks of COVID-19: a cross-sectional survey</article-title><source>J Migr Health</source><year>2021</year><volume>4</volume><fpage>100069</fpage><pub-id pub-id-type="doi">10.1016/j.jmh.2021.100069</pub-id><pub-id pub-id-type="medline">34664038</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lewandowsky</surname><given-names>S</given-names> </name><name name-style="western"><surname>Ecker</surname><given-names>UKH</given-names> </name><name name-style="western"><surname>Seifert</surname><given-names>CM</given-names> </name><name name-style="western"><surname>Schwarz</surname><given-names>N</given-names> </name><name name-style="western"><surname>Cook</surname><given-names>J</given-names> </name></person-group><article-title>Misinformation and its correction: continued influence and successful debiasing</article-title><source>Psychol Sci Public Interest</source><year>2012</year><month>12</month><volume>13</volume><issue>3</issue><fpage>106</fpage><lpage>131</lpage><pub-id pub-id-type="doi">10.1177/1529100612451018</pub-id><pub-id pub-id-type="medline">26173286</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nan</surname><given-names>X</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Thier</surname><given-names>K</given-names> </name></person-group><article-title>Why do people believe health misinformation and who is at risk? A systematic review of individual differences in susceptibility to health misinformation</article-title><source>Soc Sci Med</source><year>2022</year><month>12</month><volume>314</volume><fpage>115398</fpage><pub-id pub-id-type="doi">10.1016/j.socscimed.2022.115398</pub-id><pub-id pub-id-type="medline">36327631</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rudolph</surname><given-names>J</given-names> </name><name name-style="western"><surname>Tan</surname><given-names>S</given-names> </name><name name-style="western"><surname>Tan</surname><given-names>S</given-names> </name></person-group><article-title>War of the chatbots: Bard, Bing Chat, ChatGPT, Ernie and beyond. The new AI gold rush and its impact on higher education</article-title><source>JALT</source><year>2023</year><volume>6</volume><issue>1</issue><fpage>364</fpage><lpage>389</lpage><pub-id pub-id-type="doi">10.37074/jalt.2023.6.1.23</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="web"><article-title>GPT-4</article-title><source>OpenAI</source><year>2023</year><access-date>2024-11-13</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://openai.com/research/gpt-4">https://openai.com/research/gpt-4</ext-link></comment></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Seghier</surname><given-names>ML</given-names> </name></person-group><article-title>ChatGPT: not all languages are equal</article-title><source>Nature</source><year>2023</year><month>03</month><volume>615</volume><issue>7951</issue><fpage>216</fpage><pub-id pub-id-type="doi">10.1038/d41586-023-00680-3</pub-id><pub-id pub-id-type="medline">36882613</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sallam</surname><given-names>M</given-names> </name></person-group><article-title>ChatGPT utility in healthcare education, research, and practice: systematic review on the promising perspectives and valid concerns</article-title><source>Healthcare (Basel)</source><year>2023</year><month>03</month><day>19</day><volume>11</volume><issue>6</issue><fpage>887</fpage><pub-id pub-id-type="doi">10.3390/healthcare11060887</pub-id><pub-id pub-id-type="medline">36981544</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yin</surname><given-names>Y</given-names> </name></person-group><article-title>Sample size calculation for a proof of concept study</article-title><source>J Biopharm Stat</source><year>2002</year><month>05</month><volume>12</volume><issue>2</issue><fpage>267</fpage><lpage>276</lpage><pub-id pub-id-type="doi">10.1081/bip-120015748</pub-id><pub-id pub-id-type="medline">12413244</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Arain</surname><given-names>M</given-names> </name><name name-style="western"><surname>Campbell</surname><given-names>MJ</given-names> </name><name name-style="western"><surname>Cooper</surname><given-names>CL</given-names> </name><name name-style="western"><surname>Lancaster</surname><given-names>GA</given-names> </name></person-group><article-title>What is a pilot or feasibility study? A review of current practice and editorial policy</article-title><source>BMC Med Res Methodol</source><year>2010</year><month>07</month><day>16</day><volume>10</volume><fpage>67</fpage><pub-id pub-id-type="doi">10.1186/1471-2288-10-67</pub-id><pub-id pub-id-type="medline">20637084</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Qin</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Qing</surname><given-names>K</given-names> </name><name name-style="western"><surname>Songyun</surname><given-names>D</given-names> </name></person-group><article-title>An empirical study on readability calculation and application of Chinese online health education information&#x2014;a case study of food safety</article-title><source>J Mod Inf</source><year>2020</year><volume>40</volume><issue>5</issue><fpage>111</fpage><lpage>121</lpage><pub-id pub-id-type="doi">10.3969/j.issn.1008-0821.2020.05.014</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Li</surname><given-names>D</given-names> </name><name name-style="western"><surname>Hu</surname><given-names>T</given-names> </name><name name-style="western"><surname>Zhu</surname><given-names>W</given-names> </name><name name-style="western"><surname>Qian</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Ren</surname><given-names>H</given-names> </name><name name-style="western"><surname>Li</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Retrieval system for the Chinese Medical Subject Headings</article-title><source>Chin J Med Libr Inf Sci</source><year>2001</year><volume>10</volume><issue>4</issue><pub-id pub-id-type="doi">10.3969/j.issn.1671-3982.2001.04.001</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="thesis"><person-group person-group-type="author"><name name-style="western"><surname>Xianwen</surname><given-names>L</given-names> </name></person-group><article-title>Suitability Evaluation of the Health Education Text Material and the Health Literacy Intervention of Korean-Chinese Older Adults With Hypertension [Doctoral thesis]</article-title><year>2013</year><publisher-name>Yanbian University</publisher-name></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wolf</surname><given-names>MS</given-names> </name><name name-style="western"><surname>Davis</surname><given-names>TC</given-names> </name><name name-style="western"><surname>Shrank</surname><given-names>WH</given-names> </name><name name-style="western"><surname>Neuberger</surname><given-names>M</given-names> </name><name name-style="western"><surname>Parker</surname><given-names>RM</given-names> </name></person-group><article-title>A critical review of FDA-approved Medication Guides</article-title><source>Patient Educ Couns</source><year>2006</year><month>09</month><volume>62</volume><issue>3</issue><fpage>316</fpage><lpage>322</lpage><pub-id pub-id-type="doi">10.1016/j.pec.2006.06.010</pub-id><pub-id pub-id-type="medline">16884888</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hoffmann</surname><given-names>T</given-names> </name><name name-style="western"><surname>McKenna</surname><given-names>K</given-names> </name></person-group><article-title>Analysis of stroke patients&#x2019; and carers&#x2019; reading ability and the content and design of written materials: recommendations for improving written stroke information</article-title><source>Patient Educ Couns</source><year>2006</year><month>03</month><volume>60</volume><issue>3</issue><fpage>286</fpage><lpage>293</lpage><pub-id pub-id-type="doi">10.1016/j.pec.2005.06.020</pub-id><pub-id pub-id-type="medline">16098708</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>O&#x2019;Sullivan</surname><given-names>L</given-names> </name><name name-style="western"><surname>Sukumar</surname><given-names>P</given-names> </name><name name-style="western"><surname>Crowley</surname><given-names>R</given-names> </name><name name-style="western"><surname>McAuliffe</surname><given-names>E</given-names> </name><name name-style="western"><surname>Doran</surname><given-names>P</given-names> </name></person-group><article-title>Readability and understandability of clinical research patient information leaflets and consent forms in Ireland and the UK: a retrospective quantitative analysis</article-title><source>BMJ Open</source><year>2020</year><month>09</month><day>3</day><volume>10</volume><issue>9</issue><fpage>e037994</fpage><pub-id pub-id-type="doi">10.1136/bmjopen-2020-037994</pub-id><pub-id pub-id-type="medline">32883734</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Vears</surname><given-names>DF</given-names> </name><name name-style="western"><surname>Gillam</surname><given-names>L</given-names> </name></person-group><article-title>Inductive content analysis: a guide for beginning qualitative researchers</article-title><source>FoHPE</source><year>2022</year><volume>23</volume><issue>1</issue><fpage>111</fpage><lpage>127</lpage><pub-id pub-id-type="doi">10.11157/fohpe.v23i1.544</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tong</surname><given-names>W</given-names> </name><name name-style="western"><surname>Guan</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Artificial intelligence in global health equity: an evaluation and discussion on the application of ChatGPT, in the Chinese National Medical Licensing Examination</article-title><source>Front Med (Lausanne)</source><year>2023</year><volume>10</volume><fpage>1237432</fpage><pub-id pub-id-type="doi">10.3389/fmed.2023.1237432</pub-id><pub-id pub-id-type="medline">38020160</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yeo</surname><given-names>YH</given-names> </name><name name-style="western"><surname>Samaan</surname><given-names>JS</given-names> </name><name name-style="western"><surname>Ng</surname><given-names>WH</given-names> </name><etal/></person-group><article-title>Assessing the performance of ChatGPT in answering questions regarding cirrhosis and hepatocellular carcinoma</article-title><source>Clin Mol Hepatol</source><year>2023</year><month>07</month><volume>29</volume><issue>3</issue><fpage>721</fpage><lpage>732</lpage><pub-id pub-id-type="doi">10.3350/cmh.2023.0089</pub-id><pub-id pub-id-type="medline">36946005</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>O&#x2019;Connor</surname><given-names>C</given-names> </name><name name-style="western"><surname>Joffe</surname><given-names>H</given-names> </name></person-group><article-title>Intercoder reliability in qualitative research: debates and practical guidelines</article-title><source>Int J Qual Methods</source><year>2020</year><month>01</month><day>1</day><volume>19</volume><pub-id pub-id-type="doi">10.1177/1609406919899220</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cheung</surname><given-names>KKC</given-names> </name><name name-style="western"><surname>Tai</surname><given-names>KWH</given-names> </name></person-group><article-title>The use of intercoder reliability in qualitative interview data analysis in science education</article-title><source>Res Sci Technol Educ</source><year>2023</year><month>07</month><day>3</day><volume>41</volume><issue>3</issue><fpage>1155</fpage><lpage>1175</lpage><pub-id pub-id-type="doi">10.1080/02635143.2021.1993179</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>H</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>W</given-names> </name><name name-style="western"><surname>Dou</surname><given-names>Z</given-names> </name><name name-style="western"><surname>He</surname><given-names>L</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>L</given-names> </name></person-group><article-title>Performance and exploration of ChatGPT in medical examination, records and education in Chinese: pave the way for medical AI</article-title><source>Int J Med Inform</source><year>2023</year><month>09</month><volume>177</volume><fpage>105173</fpage><pub-id pub-id-type="doi">10.1016/j.ijmedinf.2023.105173</pub-id><pub-id pub-id-type="medline">37549499</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Herrmann-Werner</surname><given-names>A</given-names> </name><name name-style="western"><surname>Festl-Wietek</surname><given-names>T</given-names> </name><name name-style="western"><surname>Holderried</surname><given-names>F</given-names> </name><etal/></person-group><article-title>Assessing ChatGPT&#x2019;s mastery of Bloom&#x2019;s taxonomy using psychosomatic medicine exam questions: mixed-methods study</article-title><source>J Med Internet Res</source><year>2024</year><month>01</month><day>23</day><volume>26</volume><fpage>e52113</fpage><pub-id pub-id-type="doi">10.2196/52113</pub-id><pub-id pub-id-type="medline">38261378</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="web"><article-title>Chinese Dietary Guidelines</article-title><source>Chinese Nutrition Society</source><year>2022</year><access-date>2024-11-11</access-date><comment><ext-link ext-link-type="uri" xlink:href="http://dg.cnsoc.org/newslist_0402_1.htm">http://dg.cnsoc.org/newslist_0402_1.htm</ext-link></comment></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>ElSayed</surname><given-names>NA</given-names> </name><name name-style="western"><surname>Aleppo</surname><given-names>G</given-names> </name><name name-style="western"><surname>Aroda</surname><given-names>VR</given-names> </name><name name-style="western"><surname>Bannuru</surname><given-names>RR</given-names> </name><name name-style="western"><surname>Brown</surname><given-names>FM</given-names> </name><name name-style="western"><surname>Bruemmer</surname><given-names>D</given-names> </name><etal/></person-group><article-title>6. Glycemic targets: Standards of Care in Diabetes&#x2014;2023</article-title><source>Diabetes Care</source><year>2023</year><month>01</month><day>1</day><volume>46</volume><issue>Suppl 1</issue><pub-id pub-id-type="doi">10.2337/dc23-S006</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="other"><person-group person-group-type="author"><collab>Chinese Diabetes Society, National Office for Primary Diabetes Care</collab></person-group><article-title>National guidelines for the prevention and control of diabetes in primary care</article-title><year>2022</year><volume>61</volume><issue>3</issue><fpage>249</fpage><lpage>262</lpage><pub-id pub-id-type="doi">10.3760/cma.j.cn112138-20220120-000063</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kreps</surname><given-names>GL</given-names> </name><name name-style="western"><surname>Neuhauser</surname><given-names>L</given-names> </name></person-group><article-title>New directions in eHealth communication: opportunities and challenges</article-title><source>Patient Educ Couns</source><year>2010</year><month>03</month><volume>78</volume><issue>3</issue><fpage>329</fpage><lpage>336</lpage><pub-id pub-id-type="doi">10.1016/j.pec.2010.01.013</pub-id><pub-id pub-id-type="medline">20202779</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Nazir</surname><given-names>S</given-names> </name><name name-style="western"><surname>Khalil</surname><given-names>W</given-names> </name></person-group><article-title>A probabilistic approach toward evaluation of internet rumor on COVID</article-title><source>Soft comput</source><year>2022</year><volume>26</volume><issue>16</issue><fpage>8077</fpage><lpage>8088</lpage><pub-id pub-id-type="doi">10.1007/s00500-022-07064-1</pub-id><pub-id pub-id-type="medline">35528710</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Branum</surname><given-names>C</given-names> </name><name name-style="western"><surname>Schiavenato</surname><given-names>M</given-names> </name></person-group><article-title>Can ChatGPT accurately answer a PICOT question? Assessing AI response to a clinical question</article-title><source>Nurse Educ</source><year>2023</year><volume>48</volume><issue>5</issue><fpage>231</fpage><lpage>233</lpage><pub-id pub-id-type="doi">10.1097/NNE.0000000000001436</pub-id><pub-id pub-id-type="medline">37130197</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wagner</surname><given-names>MW</given-names> </name><name name-style="western"><surname>Ertl-Wagner</surname><given-names>BB</given-names> </name></person-group><article-title>Accuracy of information and references using ChatGPT-3 for retrieval of clinical radiological information</article-title><source>Can Assoc Radiol J</source><year>2024</year><month>02</month><volume>75</volume><issue>1</issue><fpage>69</fpage><lpage>73</lpage><pub-id pub-id-type="doi">10.1177/08465371231171125</pub-id><pub-id pub-id-type="medline">37078489</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cheng</surname><given-names>C</given-names> </name><name name-style="western"><surname>Dunn</surname><given-names>M</given-names> </name></person-group><article-title>Health literacy and the internet: a study on the readability of Australian online health information</article-title><source>Aust N Z J Public Health</source><year>2015</year><month>08</month><volume>39</volume><issue>4</issue><fpage>309</fpage><lpage>314</lpage><pub-id pub-id-type="doi">10.1111/1753-6405.12341</pub-id><pub-id pub-id-type="medline">25716142</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Doak</surname><given-names>CC</given-names> </name><name name-style="western"><surname>Doak</surname><given-names>LG</given-names> </name><name name-style="western"><surname>Root</surname><given-names>JH</given-names> </name></person-group><source>Teaching Patients with Low Literacy Skills</source><year>1996</year><edition>2</edition><publisher-name>Lippincott</publisher-name></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Moons</surname><given-names>P</given-names> </name><name name-style="western"><surname>Van Bulck</surname><given-names>L</given-names> </name></person-group><article-title>Using ChatGPT and Google Bard to improve the readability of written patient information: a proof of concept</article-title><source>Eur J Cardiovasc Nurs</source><year>2024</year><month>03</month><day>12</day><volume>23</volume><issue>2</issue><fpage>122</fpage><lpage>126</lpage><pub-id pub-id-type="doi">10.1093/eurjcn/zvad087</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Haver</surname><given-names>HL</given-names> </name><name name-style="western"><surname>Lin</surname><given-names>CT</given-names> </name><name name-style="western"><surname>Sirajuddin</surname><given-names>A</given-names> </name><name name-style="western"><surname>Yi</surname><given-names>PH</given-names> </name><name name-style="western"><surname>Jeudy</surname><given-names>J</given-names> </name></person-group><article-title>Use of ChatGPT, GPT-4, and Bard to improve readability of ChatGPT&#x2019;s answers to common questions about lung cancer and lung cancer screening</article-title><source>AJR Am J Roentgenol</source><year>2023</year><month>11</month><volume>221</volume><issue>5</issue><fpage>701</fpage><lpage>704</lpage><pub-id pub-id-type="doi">10.2214/AJR.23.29622</pub-id><pub-id pub-id-type="medline">37341179</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kirchner</surname><given-names>GJ</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>RY</given-names> </name><name name-style="western"><surname>Weddle</surname><given-names>JB</given-names> </name><name name-style="western"><surname>Bible</surname><given-names>JE</given-names> </name></person-group><article-title>Can artificial intelligence improve the readability of patient education materials?</article-title><source>Clin Orthop Relat Res</source><year>2023</year><month>11</month><day>1</day><volume>481</volume><issue>11</issue><fpage>2260</fpage><lpage>2267</lpage><pub-id pub-id-type="doi">10.1097/CORR.0000000000002668</pub-id><pub-id pub-id-type="medline">37116006</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jonas</surname><given-names>M</given-names> </name><name name-style="western"><surname>Kerwer</surname><given-names>M</given-names> </name><name name-style="western"><surname>Chasiotis</surname><given-names>A</given-names> </name><name name-style="western"><surname>Rosman</surname><given-names>T</given-names> </name></person-group><article-title>Indicators of trustworthiness in lay-friendly research summaries: scientificness surpasses easiness</article-title><source>Public Underst Sci</source><year>2024</year><month>01</month><volume>33</volume><issue>1</issue><fpage>37</fpage><lpage>57</lpage><pub-id pub-id-type="doi">10.1177/09636625231176377</pub-id><pub-id pub-id-type="medline">37278009</pub-id></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Scharrer</surname><given-names>L</given-names> </name><name name-style="western"><surname>Rupieper</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Stadtler</surname><given-names>M</given-names> </name><name name-style="western"><surname>Bromme</surname><given-names>R</given-names> </name></person-group><article-title>When science becomes too easy: science popularization inclines laypeople to underrate their dependence on experts</article-title><source>Public Underst Sci</source><year>2017</year><month>11</month><volume>26</volume><issue>8</issue><fpage>1003</fpage><lpage>1018</lpage><pub-id pub-id-type="doi">10.1177/0963662516680311</pub-id><pub-id pub-id-type="medline">27899471</pub-id></nlm-citation></ref><ref id="ref44"><label>44</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Li</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>X</given-names> </name><name name-style="western"><surname>Xu</surname><given-names>L</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>M</given-names> </name><name name-style="western"><surname>Huang</surname><given-names>C</given-names> </name></person-group><article-title>Hot topic recognition of health rumors based on anti-rumor articles on the WeChat official account platform: topic modeling</article-title><source>J Med Internet Res</source><year>2023</year><month>09</month><day>21</day><volume>25</volume><fpage>e45019</fpage><pub-id pub-id-type="doi">10.2196/45019</pub-id></nlm-citation></ref><ref id="ref45"><label>45</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ryan</surname><given-names>L</given-names> </name><name name-style="western"><surname>Logsdon</surname><given-names>MC</given-names> </name><name name-style="western"><surname>McGill</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Evaluation of printed health education materials for use by low-education families</article-title><source>J Nurs Scholarsh</source><year>2014</year><month>07</month><volume>46</volume><issue>4</issue><fpage>218</fpage><lpage>228</lpage><pub-id pub-id-type="doi">10.1111/jnu.12076</pub-id><pub-id pub-id-type="medline">24597957</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Health rumor, misconception, and truth.</p><media xlink:href="formative_v8i1e63188_app1.docx" xlink:title="DOCX File, 17 KB"/></supplementary-material><supplementary-material id="app2"><label>Multimedia Appendix 2</label><p>The readability scores of the health essays based on rumor, misconception, and truth.</p><media xlink:href="formative_v8i1e63188_app2.docx" xlink:title="DOCX File, 19 KB"/></supplementary-material><supplementary-material id="app3"><label>Multimedia Appendix 3</label><p>The Chinese Suitability Assessment of Materials item grade distribution.</p><media xlink:href="formative_v8i1e63188_app3.docx" xlink:title="DOCX File, 475 KB"/></supplementary-material></app-group></back></article>